In [1]:
!git clone https://github.com/RichardStaszkiewicz/CNN-Hyperparameter-Tuning.git
!mv /content/CNN-Hyperparameter-Tuning/modules /content/modules
!mv /content/CNN-Hyperparameter-Tuning/model /content/model
!mkdir logs
!pip install "ray[tune]" torch torchvision pytorch-lightning

Cloning into 'CNN-Hyperparameter-Tuning'...
remote: Enumerating objects: 43, done.[K
remote: Counting objects: 100% (43/43), done.[K
remote: Compressing objects: 100% (34/34), done.[K
remote: Total 43 (delta 13), reused 33 (delta 6), pack-reused 0[K
Receiving objects: 100% (43/43), 94.01 KiB | 7.23 MiB/s, done.
Resolving deltas: 100% (13/13), done.
Collecting ray[tune]
  Downloading ray-2.6.3-cp310-cp310-manylinux2014_x86_64.whl (56.9 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m56.9/56.9 MB[0m [31m17.7 MB/s[0m eta [36m0:00:00[0m
Collecting pytorch-lightning
  Downloading pytorch_lightning-2.0.8-py3-none-any.whl (727 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m727.0/727.0 kB[0m [31m60.8 MB/s[0m eta [36m0:00:00[0m
Collecting tensorboardX>=1.9 (from ray[tune])
  Downloading tensorboardX-2.6.2.2-py2.py3-none-any.whl (101 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m101.7/101.7 kB[0m [31m12.9 MB/s[0m eta [3

In [2]:
from modules import plmodules as plm
from ray import tune, air
from ray.tune import CLIReporter
from ray.tune.schedulers import ASHAScheduler, PopulationBasedTraining
from ray.tune.integration.pytorch_lightning import TuneReportCallback, TuneReportCheckpointCallback
import pytorch_lightning as pl
import yaml

## Config

In [3]:
# Read the project's YAML configuration and keep only its `model` section,
# which serves as the baseline (non-tuned) configuration for every trial.
with open("/content/model/configs/model.yaml", 'r') as config_file:
    default_config = yaml.safe_load(config_file)['model']

In [7]:
# Grid search (alternative search space; swap with the block below to use it)
# search_config = {
#     "batch_size": tune.grid_search([64, 128, 256]),
#     "lr": tune.grid_search([0.01, 0.1]),
#     "mlp_out_l0": tune.grid_search([64, 128]),
#     "mlp_af_l0": tune.grid_search(['relu', 'none']),
#     "mlp_bn_l0": tune.grid_search([True, False]),
#     "mlp_do_l0": tune.grid_search([0.1, 0.3])
# }
# Random search
# Keys of the form `mlp_<field>_l<N>` are per-layer overrides that
# `actualise_config` writes into block N of the MLP configuration.
search_config = {
    "batch_size": tune.choice([64, 128, 256]),
    "lr": tune.uniform(0.01, 0.1),
    # Layer width must be an integer; tune.uniform would sample floats.
    # randint's upper bound is exclusive, so 129 keeps 128 reachable.
    "mlp_out_l0": tune.randint(64, 129),
    # NOTE(review): the grid-search variant above spells this option 'none'
    # (lowercase); confirm which spelling the model code actually expects.
    "mlp_af_l0": tune.choice(['relu', 'None']),
    "mlp_bn_l0": tune.choice([True, False]),
    "mlp_do_l0": tune.uniform(0.095, 0.305)
}

In [8]:
# Overlay the search space on the baseline config; on a key clash the search
# space wins. The merge is shallow, so nested dicts are shared with
# `default_config`.
config = {**default_config, **search_config}

## Schedulers

In [9]:
# ASHA early-stopping scheduler driven by wall-clock time: `time_attr` selects
# the result field used as the time axis, so `grace_period` and `max_t` below
# are expressed in seconds of total trial time.
scheduler_asha = ASHAScheduler(
    reduction_factor=2,        # halving rate between successive rungs
    grace_period=30,           # minimum time before a trial may be stopped
    max_t=150,                 # time after which a trial is stopped regardless
    time_attr="time_total_s",
)

## Callbacks

In [10]:
# Report Lightning's logged metrics to Ray Tune and save a checkpoint after
# every validation run. Keys are the names Tune will see; values are the names
# looked up in `trainer.callback_metrics`.
#
# `time_total_s` is intentionally NOT listed here: it is not a Lightning metric
# (listing it only produced a "Metric time_total_s does not exist in
# `trainer.callback_metrics`" warning on every validation end). Ray Tune adds
# `time_total_s` to each reported result on its own, so the scheduler and the
# reporter can still use it.
tune_report_callback = TuneReportCheckpointCallback(
    metrics={
        "ptl/train_loss": "ptl/train_loss",
        "ptl/train_accuracy": "ptl/train_accuracy",
        "ptl/val_loss": "ptl/val_loss",
        "ptl/val_accuracy": "ptl/val_accuracy",
    },
    filename="ray_ckpt",
    on="validation_end",
)

## Trainable

In [None]:
def _indexed_overrides(config, prefix):
  """Collect ``{layer_index: value}`` for every ``<prefix><digits>`` key of ``config``."""
  overrides = {}
  for key, value in config.items():
    if not (isinstance(key, str) and key.startswith(prefix)):
      continue
    suffix = key[len(prefix):]
    # Ignore keys that merely share the prefix but carry no layer index.
    if suffix.isdigit():
      overrides[int(suffix)] = value
  return overrides


def actualise_config(config):
  """Apply flat per-layer hyperparameters to the nested MLP configuration.

  Flat keys of the form ``mlp_out_l<N>``, ``mlp_af_l<N>``, ``mlp_bn_l<N>`` and
  ``mlp_do_l<N>`` are written into ``config["mlp_config"]["block_list"][N]`` as
  ``out_size``, ``activation_fun``, ``batch_norm`` and ``dropout``.
  Changing a block's ``out_size`` also updates the following block's
  ``in_size`` so consecutive layers stay compatible.

  Args:
    config: Mapping holding ``mlp_config`` (with a ``block_list`` list of
      per-block dicts) plus any of the flat override keys described above.

  Returns:
    A deep copy of ``config`` with the overrides applied. The input mapping
    and its nested dicts are left untouched.

  Raises:
    KeyError: If ``mlp_config`` / ``block_list`` is missing.
    IndexError: If an override names a block index that does not exist.
  """
  import copy

  # Work on a copy: the merged search config shares its nested dicts with the
  # baseline config, so in-place edits would leak between uses.
  updated = copy.deepcopy(config)
  blocks = updated["mlp_config"]['block_list']

  for idx, width in _indexed_overrides(updated, "mlp_out_l").items():
    # Continuous samplers produce floats; layer sizes must be integers.
    width = int(width)
    blocks[idx]['out_size'] = width
    # The last block has no successor whose input size needs adjusting.
    if idx + 1 < len(blocks):
      blocks[idx + 1]['in_size'] = width

  simple_fields = (
    ("mlp_af_l", 'activation_fun'),
    ("mlp_bn_l", 'batch_norm'),
    ("mlp_do_l", 'dropout'),
  )
  for prefix, field in simple_fields:
    for idx, value in _indexed_overrides(updated, prefix).items():
      blocks[idx][field] = value
  return updated

In [None]:
def run_with_tune(config, epochs=50):
    """Train one model for a single Ray Tune trial.

    Args:
        config: Trial configuration as resolved by Ray Tune; it is passed
            through `actualise_config` before the model is built and must
            contain `batch_size`.
        epochs: Upper bound on training epochs (the scheduler may stop the
            trial earlier).

    Metrics and checkpoints reach Tune through `tune_report_callback`; the
    function itself returns nothing.
    """
    config = actualise_config(config)
    model = plm.MNISTClassifier(config)
    dm = plm.MNISTDataModule(config['batch_size'])
    # NOTE(review): the trial logs show the dataset being downloaded again for
    # each trial; presumably the data module resolves its data directory
    # relative to the per-trial working directory — consider a shared absolute
    # path if the data module allows it.
    trainer = pl.Trainer(
        max_epochs=epochs,
        fast_dev_run=False,
        # Each worker's progress bar is forwarded to the driver and floods the
        # notebook output; Tune's own reporter already shows trial progress.
        enable_progress_bar=False,
        callbacks=[
            tune_report_callback,
        ],
    )
    trainer.fit(model, dm)

## Reporter

In [None]:
# Console reporter: one column per tuned hyperparameter plus the key metrics.
# `parameter_columns` must be a flat list of parameter names; wrapping
# `search_config.keys()` in a list literal would yield a single-element list
# holding a dict_keys view instead.
reporter = CLIReporter(
    parameter_columns=list(search_config.keys()),
    metric_columns=[
        "time_total_s",
        "ptl/train_accuracy",
        "ptl/val_loss",
        "ptl/val_accuracy",
        "training_iteration",
    ],
)

## Trial

In [None]:
# Bind the constant (non-tuned) `epochs` argument to the trainable.
train_fn_with_parameters = tune.with_parameters(
    run_with_tune,
    epochs=50,
)

In [None]:
# Resources requested for each trial.
resources_per_trial = dict(cpu=2, gpu=1)

In [None]:
# Trainable wrapped with its per-trial resource request.
trainable_with_resources = tune.with_resources(
    train_fn_with_parameters,
    resources=resources_per_trial,
)

# Search strategy: minimise validation loss, with ASHA stopping weak trials.
# Optional knobs left disabled: time_budget_s=600, num_samples=-1.
# NOTE(review): num_samples is left at its default (1); with a purely random
# search space that yields a single trial — confirm this is intended.
asha_tune_config = tune.TuneConfig(
    metric="ptl/val_loss",
    mode="min",
    search_alg=tune.search.BasicVariantGenerator(),
    scheduler=scheduler_asha,
)

# Experiment name and console reporting.
asha_run_config = air.RunConfig(
    name="tune_mnist_asha",
    progress_reporter=reporter,
)

tuner = tune.Tuner(
    trainable_with_resources,
    tune_config=asha_tune_config,
    run_config=asha_run_config,
    param_space=config,
)
results = tuner.fit()

2023-09-02 16:40:14,241	INFO worker.py:1621 -- Started a local Ray instance.
2023-09-02 16:40:16,715	INFO tune.py:226 -- Initializing Ray automatically. For cluster usage or custom Ray initialization, call `ray.init(...)` before `Tuner(...)`.
2023-09-02 16:40:16,720	INFO tune.py:666 -- [output] This will use the new output engine with verbosity 1. To disable the new output and use the legacy output engine, set the environment variable RAY_AIR_NEW_OUTPUT=0. For more information, please see https://github.com/ray-project/ray/issues/36949


+----------------------------------------------------------+
| Configuration for experiment     tune_mnist_asha         |
+----------------------------------------------------------+
| Search algorithm                 BasicVariantGenerator   |
| Scheduler                        AsyncHyperBandScheduler |
| Number of trials                 96                      |
+----------------------------------------------------------+

View detailed results here: /root/ray_results/tune_mnist_asha
To visualize your results with TensorBoard, run: `tensorboard --logdir /root/ray_results/tune_mnist_asha`

Trial status: 16 PENDING
Current time: 2023-09-02 16:40:17. Total running time: 0s
Logical resource usage: 0/2 CPUs, 0/1 GPUs
+---------------------------------------------------------------------------------------------------------------------+
| Trial name                  status       batch_size     lr     mlp_out_l0   mlp_af_l0     mlp_bn_l0       mlp_do_l0 |
+------------------------------------

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00000_0_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs
[2m[36m(run_with_tune pid=1086)[0m 2023-09-02 16:40:29.798559: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
[2m[36m(run_with_tune pid=1086)[0m To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


  0%|          | 0/26421880 [00:00<?, ?it/s]
  0%|          | 32768/26421880 [00:00<02:12, 199567.80it/s]
  0%|          | 65536/26421880 [00:00<02:15, 194473.58it/s]
  0%|          | 131072/26421880 [00:00<01:33, 280967.35it/s]
  1%|          | 229376/26421880 [00:00<01:06, 396746.27it/s]
  2%|▏         | 491520/26421880 [00:00<00:32, 806017.32it/s]
  4%|▎         | 950272/26421880 [00:01<00:17, 1442797.10it/s]
  7%|▋         | 1933312/26421880 [00:01<00:08, 2846348.92it/s]
 15%|█▍        | 3833856/26421880 [00:01<00:04, 5471456.62it/s]
 26%|██▌       | 6914048/26421880 [00:01<00:02, 9375356.92it/s]
 38%|███▊      | 9994240/26421880 [00:01<00:01, 12024674.52it/s]
 50%|████▉     | 13107200/26421880 [00:01<00:00, 13900337.38it/s]
 61%|██████    | 16023552/26421880 [00:02<00:00, 14842493.83it/s]
 71%|███████   | 18776064/26421880 [00:02<00:00, 15205987.53it/s]
 83%|████████▎ | 21856256/26421880 [00:02<00:00, 16035769.18it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24936448/26421880 [00:02<00:00, 16619076.65it/s]100%|██████████| 26421880/26421880 [00:02<00:00, 10276525.84it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s]
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174088.54it/s]100%|██████████| 29515/29515 [00:00<00:00, 173856.28it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


  0%|          | 0/4422102 [00:00<?, ?it/s]
  1%|          | 32768/4422102 [00:00<00:22, 191263.85it/s]
  1%|▏         | 65536/4422102 [00:00<00:22, 190777.85it/s]
  3%|▎         | 131072/4422102 [00:00<00:15, 277852.38it/s]
  5%|▌         | 229376/4422102 [00:00<00:10, 393737.90it/s]
 11%|█         | 491520/4422102 [00:00<00:04, 801599.91it/s]
 21%|██▏       | 950272/4422102 [00:01<00:02, 1435987.18it/s]
 44%|████▎     | 1933312/4422102 [00:01<00:00, 2836585.10it/s]
100%|██████████| 4422102/4422102 [00:01<00:00, 3212514.73it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 


[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s]100%|██████████| 5148/5148 [00:00<00:00, 33896824.16it/s]


[2m[36m(run_with_tune pid=1086)[0m Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Total params
[2m[36m(run_with_tune pid=1086)[0m 0.061     Total estimated model params size (MB)


[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m   out = self.act_fun(out)


Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:01<00:00,  1.50it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:01<00:54, 13.50it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:02<00:37, 18.77it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:02<00:29, 23.26it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:03<00:25, 26.61it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:03<00:22, 28.59it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:20, 30.22it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:19, 31.75it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:17, 32.83it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:16, 33.91it/s, v_num=0]
Trial status: 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:40:47. Total running time: 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
+---------------------------------------------------------------------------------------------------------------------+
| T

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:21, 33.58it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:18, 38.85it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:16, 40.96it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:01<00:15, 42.27it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:02<00:15, 42.68it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:02<00:14, 43.27it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:03<00:13, 43.81it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:03<00:13, 44.00it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:04<00:12, 43.94it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:04<00:12, 43.48it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:05<00:12, 41.00it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:06<00:13, 39.16it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:06<00:12, 37.76it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:07<00:13, 36.08it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:08<00:12, 35.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:01<00:41, 17.45it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:34, 20.75it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:02<00:29, 23.08it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:03<00:25, 26.27it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:03<00:22, 28.91it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:03<00:20, 30.62it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:04<00:18, 32.23it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:04<00:17, 33.48it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:05<00:16, 34.31it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:05<00:15, 35.25it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:06<00:14, 35.89it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:06<00:13, 36.48it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:07<00:13, 36.98it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:07<00:12, 37.54it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:07<00:11, 37.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   3%|▎         | 20/750 [00:00<00:21, 33.23it/s, v_num=0]
Epoch 3:   5%|▌         | 40/750 [00:01<00:18, 37.75it/s, v_num=0]
Epoch 3:   8%|▊         | 60/750 [00:01<00:17, 39.84it/s, v_num=0]
Epoch 3:  11%|█         | 80/750 [00:01<00:16, 41.49it/s, v_num=0]
Epoch 3:  13%|█▎        | 100/750 [00:02<00:15, 42.10it/s, v_num=0]
Epoch 3:  16%|█▌        | 120/750 [00:02<00:14, 42.89it/s, v_num=0]
Epoch 3:  19%|█▊        | 140/750 [00:03<00:14, 43.00it/s, v_num=0]
Epoch 3:  21%|██▏       | 160/750 [00:03<00:13, 43.28it/s, v_num=0]
Epoch 3:  24%|██▍       | 180/750 [00:04<00:13, 42.62it/s, v_num=0]
Epoch 3:  27%|██▋       | 200/750 [00:04<00:13, 42.17it/s, v_num=0]
Epoch 3:  29%|██▉       | 220/750 [00:05<00:13, 39.81it/s, v_num=0]
Epoch 3:  32%|███▏      | 240/750 [00:06<00:13, 38.48it/s, v_num=0]
Epoch 3:  35%|███▍      | 260/750 [00:06<00:13, 37.43it/s, v_num=0]
Epoch 3:  37%|███▋      | 280/750 [00:07<00:12, 36.47it/s, v_num=0]
Epoch 3:  40%|████      | 300/750 [00:08<00:12, 35.4

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   3%|▎         | 20/750 [00:00<00:34, 21.05it/s, v_num=0]
Epoch 4:   5%|▌         | 40/750 [00:01<00:30, 23.35it/s, v_num=0]
Epoch 4:   8%|▊         | 60/750 [00:02<00:28, 24.01it/s, v_num=0]
Epoch 4:  11%|█         | 80/750 [00:02<00:24, 27.26it/s, v_num=0]
Epoch 4:  13%|█▎        | 100/750 [00:03<00:21, 29.83it/s, v_num=0]
Epoch 4:  16%|█▌        | 120/750 [00:03<00:20, 31.27it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:04<00:18, 32.39it/s, v_num=0]
Epoch 4:  21%|██▏       | 160/750 [00:04<00:17, 33.55it/s, v_num=0]
Epoch 4:  24%|██▍       | 180/750 [00:05<00:16, 34.53it/s, v_num=0]
Epoch 4:  27%|██▋       | 200/750 [00:05<00:15, 35.41it/s, v_num=0]
Epoch 4:  29%|██▉       | 220/750 [00:06<00:14, 36.13it/s, v_num=0]
Epoch 4:  32%|███▏      | 240/750 [00:06<00:13, 36.69it/s, v_num=0]
Epoch 4:  35%|███▍      | 260/750 [00:06<00:13, 37.21it/s, v_num=0]
Epoch 4:  37%|███▋      | 280/750 [00:07<00:12, 37.56it/s, v_num=0]
Epoch 4:  40%|████      | 300/750 [00:07<00:11, 37.9

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   3%|▎         | 20/750 [00:00<00:22, 33.16it/s, v_num=0]
Epoch 5:   5%|▌         | 40/750 [00:01<00:18, 37.88it/s, v_num=0]
Epoch 5:   8%|▊         | 60/750 [00:01<00:17, 38.96it/s, v_num=0]
Epoch 5:  11%|█         | 80/750 [00:01<00:16, 40.76it/s, v_num=0]
Trial status: 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:42:47. Total running time: 2min 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.472860723733902 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00001_1_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194387.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194613.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283422.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402670.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 819080.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1467593.52it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172575.39it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172344.98it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 189962.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 189766.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 276087.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 391607.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 796908.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1428526.34it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
Trial status: 1 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:43:17. Total running time: 3min 0s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fu

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5422582.60it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3194935.15it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33066274.11it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 31.77it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 22.14it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.26it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.46it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.22it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 24.60it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:11, 22.66it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:10, 21.69it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:10, 20.76it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:08<00:09, 20.12it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:08, 19.72it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 20.31it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.71it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:20, 16.91it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:19, 17.37it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:18, 16.97it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:17, 16.67it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:16, 16.49it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.49it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:13, 17.57it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.22it/s, v_num=0]
Trial status: 1 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:43:47. Total running time: 3min 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:27, 12.83it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:23, 14.52it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:03<00:18, 17.32it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:04<00:15, 19.09it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:04<00:13, 20.29it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:05<00:11, 21.26it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:06<00:10, 22.15it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:07<00:09, 22.64it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:07<00:08, 23.04it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:08<00:07, 23.50it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:09<00:06, 23.83it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:09<00:05, 24.02it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:10<00:04, 24.27it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:11<00:03, 24.53it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:12<00:03, 24.6

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00002_2_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193816.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193413.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281671.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 399590.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 812919.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1456551.22it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172227.01it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171897.47it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193226.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192868.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280710.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398175.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 809009.75it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1450848.23it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37947762.73it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 23.97it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:02<00:19,  8.56it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:04<00:16,  8.75it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:06<00:14,  8.74it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:08<00:11,  9.67it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.42it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:06, 11.14it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:12<00:04, 11.61it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.03it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.35it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.58it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%| 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 2 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:44:48. Total running time: 4min 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+-----------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:02<00:21,  7.83it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:04<00:15,  9.46it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:05<00:11, 10.82it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:06<00:09, 11.88it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:08<00:07, 12.30it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:09<00:05, 12.85it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:10<00:03, 13.17it/s, v_num=0]
Trial status: 2 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:45:18. Total running time: 5min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_cha

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00003_3_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190986.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190642.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 277489.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 393548.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:35, 732701.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:19, 1335814.45it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176736.97it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176412.83it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 197461.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196990.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 286639.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 406669.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 756820.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:00<00:02, 1369149.90it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 24179481.51it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 95.40it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:20, 35.37it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:00<00:17, 40.31it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.89it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.99it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:14, 43.84it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 40.71it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:15, 39.73it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:15, 37.34it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:15, 36.15it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:15, 34.79it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:06<00:15, 33.96it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:07<00:15, 33.18it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:08<00:15, 32.38it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00004_4_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 192038.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191676.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 278808.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 395414.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:35, 736057.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 917504/26421880 [00:01<00:18, 1396435.60it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 26421880/26421880 [00:02<00:00, 10222173.77it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171943.31it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171707.68it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193119.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192759.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280485.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398153.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 810217.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1451197.97it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 39546294.86it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

                                                                            
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 23.18it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:12, 26.10it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:11, 27.04it/s, v_num=0]
Epoch 0: 100%|██████████| 750/750 [00:36<00:00, 20.51it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A
Epoch 0:  21%|██▏       | 80/375 [00:03<00:12, 24.33it/s, v_num=0]


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process


Epoch 0:  27%|██▋       | 100/375 [00:04<00:12, 21.60it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:12, 20.55it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:07<00:11, 19.93it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:08<00:11, 19.31it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:09<00:10, 19.11it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:08, 19.64it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 20.28it/s, v_num=0]
Trial status: 4 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:46:18. Total running time: 6min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in

[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820><function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m         self._shutdown_workers()self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=108

[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/94 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/94 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  21%|██▏       | 20/94 [00:00<00:02, 33.53it/s][A
Epoch 0: 100%|██████████| 750/750 [00:51<00:00, 14.63it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 40/94 [00:01<00:01, 30.97it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  64%|██████▍   | 60/94 [00:01<00:01, 30.64it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  85%|████████▌ | 80/94 [00:02<00:00, 31.44it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 0: 100%|██████████| 375/375 [00:19<00:00, 19.00it/s, v_num=0]
Epoch 1:   0%|          | 0/375 [00:00<?, ?it/s, v_num=0]


[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:26, 13.31it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:22, 14.77it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:20, 15.33it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:05<00:18, 15.63it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:17, 15.87it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.66it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:13, 17.78it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.56it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 19.31it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:08, 19.95it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 20.46it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.97it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 21.42it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:12<00:04, 21.79it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:13<00:03, 22.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00005_5_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193236.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192687.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280340.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397580.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 809122.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1449864.92it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172195.63it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171963.37it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196163.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195789.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284944.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 404279.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|▉         | 425984/4422102 [00:00<00:05, 690708.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:00<00:02, 1392548.85it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  79%|███████▊  | 3473408/4422102 [00:01<00:00, 5086901.22it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3296254.80it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 38557637.49it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 88.10it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.79it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.56it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 13.34it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:06<00:09, 11.96it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:08<00:07, 11.17it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:06, 11.04it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:12<00:04, 11.44it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 11.87it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 11.87it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.12it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.34it/s, v_num=0]
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Val

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.84it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:03<00:11, 12.94it/s, v_num=0]
Trial status: 5 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:47:18. Total running time: 7min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00006_6_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191748.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191535.35it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 278819.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 395785.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 804971.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1443009.77it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177565.68it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177259.05it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191692.01it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191280.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278347.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 394428.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 802840.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1439443.04it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5465307.09it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3219392.29it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34057219.23it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 34.68it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.88it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.00it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 41.32it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 41.14it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 41.70it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.55it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.57it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 42.90it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 43.15it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 43.52it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:11, 43.99it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:05<00:11, 43.90it/s, v_num=0]
Epoch 0:  37%|███▋      | 280/750 [00:06<00:10, 43.82it/s, v_num=0]
Ep

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00007_7_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191428.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191776.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 279413.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397352.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 807131.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1448024.53it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173007.58it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172699.85it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192329.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191995.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279328.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396052.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 806068.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1445592.39it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5486935.58it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3232634.29it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37486592.00it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 57.54it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.78it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 25.39it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 26.00it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 26.66it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 26.67it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 26.90it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:08, 27.27it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:05<00:07, 26.95it/s, v_num=0]
Trial status: 7 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:48:18. Total running time: 8min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:16, 22.08it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:13, 25.20it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 25.47it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 26.08it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:03<00:10, 26.49it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:09, 26.49it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:08, 26.62it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:05<00:08, 26.84it/s, v_num=0]
Trial status: 7 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:48:48. Total running time: 8min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:00<00:15, 23.35it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:01<00:13, 24.03it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:02<00:12, 25.11it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:03<00:11, 26.11it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:03<00:10, 25.75it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:05<00:10, 23.74it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:06<00:10, 22.60it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:07<00:09, 21.74it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:08<00:09, 20.95it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:09<00:08, 20.34it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:10<00:07, 20.06it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:11<00:06, 20.58it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:12<00:05, 21.08it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:13<00:04, 21.34it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:13<00:03, 21.6

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00008_8_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190287.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 189985.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 276505.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 393335.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 798268.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1432677.00it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24641536/26421880 [00:02<00:00, 16183622.87it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10180106.89it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175060.22it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174675.37it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193415.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193053.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280984.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398510.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 810809.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1453764.86it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5517182.15it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3249768.91it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35630820.12it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:11, 14.02it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.75it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:03<00:08, 15.08it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 15.00it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:05, 14.89it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:08<00:04, 13.87it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:10<00:03, 12.84it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.13it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.37it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.59it/s, v_num=0]
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(ru

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 8 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:49:48. Total running time: 9min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+-----------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:13, 12.44it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 14.25it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:04<00:09, 14.18it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:06<00:08, 12.48it/s, v_num=0]
Epoch 5: 100%|██████████| 750/750 [07:29<00:00,  1.67it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:09<00:08, 10.89it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:11<00:06, 10.84it/s, v_num=0]
Trial status: 8 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:50:18. Total running time: 10min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_ch

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m 
Epoch 2: 100%|██████████| 188/188 [05:28<00:00,  1.75s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 1: 100%|██████████| 375/375 [04:18<00:00,  1.45it/s, v_num=0]
Trial status: 8 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:50:48. Total running time: 10min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10,

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00009_9_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 192993.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192541.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280157.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397501.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 808941.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1449886.76it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▌| 25296896/26421880 [00:02<00:00, 17041395.27it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10312932.12it/s]


Trial status: 9 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:51:18. Total running time: 11min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+-----------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174032.25it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173784.52it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195198.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195001.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 283897.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402750.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 819622.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1471893.53it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5579807.51it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3283763.17it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 25078138.20it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 37.38it/s]
                                                                           
Training:   0%|          | 0/750 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:36, 20.06it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:31, 22.70it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:02<00:30, 22.95it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:03<00:26, 24.95it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:03<00:23, 27.39it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:04<00:21, 29.15it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:19, 30.71it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:18, 32.23it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:17, 33.44it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:16, 34.23it/s, v_num=0]
Epoc

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00010_10_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195454.83it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 195065.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283722.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402206.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 818124.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1467640.78it/s][A

Trial status: 10 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:51:48. Total running time: 11min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  7%|▋         | 1933312/26421880 [00:01<00:08, 2895613.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 15%|█▍        | 3833856/26421880 [00:01<00:04, 5567271.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 26%|██▋       | 6979584/26421880 [00:01<00:02, 9668008.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 38%|███▊      | 10125312/26421880 [00:01<00:01, 12452327.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 50%|████▉     | 13205504/26421880 [00:01<00:00, 14241263.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 61%|██████▏   | 16187392/26421880 [00:02<00:00, 15301380.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 73%|███████▎  | 19300352/26

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174368.08it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174108.37it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194282.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193888.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282236.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▍         | 196608/4422102 [00:00<00:13, 323378.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|▉         | 425984/4422102 [00:00<00:05, 695412.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 19%|█▉        | 851968/4422102 [00:01<00:02, 1314717.03it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  76%|███████▋  | 3375104/4422102 [00:01<00:00, 4868926.28it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3260231.59it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36659213.91it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:31<00:00, 23.67it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                           [AEpoch 0: 100%|██████████| 750/750 [00:31<00:00, 23.66it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A
[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 42.43it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0: 100%|██████████| 750/750 [00:32<00:00, 23.30it/s, v_num=0]
Epoch 0: 100%|██████████| 750/750 [00:32<00:00, 23.30it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A
                                                                          [A
Epoch 0: 100%|██████████| 750/750 [00:32<00:00, 23.22it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

Epoch 0:   5%|▌         | 20/375 [00:01<00:24, 14.72it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:02<00:17, 19.19it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:14, 21.26it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:13, 22.60it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 23.59it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:10, 23.77it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 24.41it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 24.50it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:07, 24.83it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 24.89it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:08<00:06, 25.10it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:09<00:05, 25.25it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:10<00:04, 25.37it/s, v_num=0]
Epoch 0:  75%|███████▍  | 280/375 [00:11<00:03, 25.34it/s, v_num=0]
Epoch 0:  80%|████████  | 300/375 [00:12<00:03, 24.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:15, 22.63it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:13, 24.72it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 25.70it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 25.68it/s, v_num=0]
Trial status: 10 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:52:18. Total running time: 12min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00011_11_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193201.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192668.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280232.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397441.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 809275.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1449209.87it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  91%|█████████▏| 24150016/26421880 [00:02<00:00, 16105018.65it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10316917.42it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173078.94it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172822.33it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 198023.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 197592.15it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 287770.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▍         | 196608/4422102 [00:00<00:12, 330015.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  9%|▉         | 393216/4422102 [00:00<00:06, 638712.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 18%|█▊        | 786432/4422102 [00:00<00:02, 1227820.59it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35748802.97it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 44.52it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.81it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:09, 14.96it/s, v_num=0]
Trial status: 11 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:52:48. Total running time: 12min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size':

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.98it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.72it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.87it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.01it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:06, 12.87it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:10<00:05, 11.97it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:11<00:04, 11.84it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:13<00:02, 12.29it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.51it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:14<00:00, 12.76it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
Trial status: 11 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:53:19. Tot

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00012_12_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194132.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193751.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281965.35it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400026.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 813825.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1458147.70it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  97%|█████████▋| 25591808/26421880 [00:02<00:00, 17324445.39it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10385113.71it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172982.20it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172642.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196845.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196394.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285750.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▍         | 196608/4422102 [00:00<00:12, 327887.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  9%|▉         | 393216/4422102 [00:00<00:06, 633485.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 18%|█▊        | 786432/4422102 [00:01<00:02, 1218630.06it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  70%|███████   | 3112960/4422102 [00:01<00:00, 4541350.94it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3298528.12it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 29457403.81it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 101.28it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:20, 35.51it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.68it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 40.03it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 40.72it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 41.53it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 42.40it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.43it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.74it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 42.97it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 43.47it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 43.71it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:11, 43.84it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:05<00:11, 43.96it/s, v_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:21, 33.35it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:18, 37.83it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:16, 40.78it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:01<00:16, 41.52it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:02<00:15, 42.47it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:03<00:16, 39.21it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:03<00:16, 37.66it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:04<00:16, 36.61it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:05<00:16, 35.29it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:05<00:16, 34.16it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:06<00:15, 33.47it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:07<00:15, 32.91it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:08<00:15, 32.43it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:08<00:14, 31.92it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:09<00:13, 32.3

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1: 100%|██████████| 750/750 [00:25<00:00, 29.72it/s, v_num=0]
Epoch 2:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 2:   3%|▎         | 20/750 [00:00<00:21, 33.41it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:18, 39.03it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:16, 40.84it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:01<00:16, 41.64it/s, v_num=0]
Trial status: 12 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:54:19. Total running time: 14min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'sa

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   3%|▎         | 20/750 [00:00<00:27, 26.74it/s, v_num=0]
Epoch 3:   5%|▌         | 40/750 [00:01<00:22, 32.15it/s, v_num=0]
Epoch 3:   8%|▊         | 60/750 [00:01<00:19, 35.01it/s, v_num=0]
Epoch 3:  11%|█         | 80/750 [00:02<00:18, 36.68it/s, v_num=0]
Epoch 3:  13%|█▎        | 100/750 [00:02<00:17, 37.53it/s, v_num=0]
Epoch 3:  16%|█▌        | 120/750 [00:03<00:16, 37.38it/s, v_num=0]
Epoch 3:  19%|█▊        | 140/750 [00:04<00:17, 34.49it/s, v_num=0]
Epoch 3:  21%|██▏       | 160/750 [00:04<00:17, 32.79it/s, v_num=0]
Epoch 3:  24%|██▍       | 180/750 [00:05<00:18, 31.37it/s, v_num=0]
Epoch 3:  27%|██▋       | 200/750 [00:06<00:17, 30.96it/s, v_num=0]
Epoch 3:  29%|██▉       | 220/750 [00:07<00:17, 30.30it/s, v_num=0]
Epoch 3:  32%|███▏      | 240/750 [00:08<00:17, 30.00it/s, v_num=0]
Epoch 3:  35%|███▍      | 260/750 [00:08<00:16, 29.61it/s, v_num=0]
Trial status: 12 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:54:49. Total running time: 14min 32s
Lo

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3: 100%|██████████| 750/750 [00:26<00:00, 28.33it/s, v_num=0]
Epoch 4:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 4:   3%|▎         | 20/750 [00:00<00:23, 31.58it/s, v_num=0]
Epoch 4:   5%|▌         | 40/750 [00:01<00:18, 37.38it/s, v_num=0]
Epoch 4:   8%|▊         | 60/750 [00:01<00:17, 38.69it/s, v_num=0]
Epoch 4:  11%|█         | 80/750 [00:02<00:16, 39.89it/s, v_num=0]
Epoch 4:  13%|█▎        | 100/750 [00:02<00:15, 41.02it/s, v_num=0]
Epoch 4:  16%|█▌        | 120/750 [00:02<00:15, 41.71it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:03<00:14, 42.17it/s, v_num=0]
Epoch 4:  21%|██▏       | 160/750 [00:03<00:13, 42.54it/s, v_num=0]
Epoch 4:  24%|██▍       | 180/750 [00:04<00:13, 42.84it/s, v_num=0]
Epoch 4:  27%|██▋       | 200/750 [00:04<00:12, 42.40it/s, v_num=0]
Epoch 4:  29%|██▉       | 220/750 [00:05<00:12, 42.68it/s, v_num=0]
Epoch 4:  32%|███▏      | 240/750 [00:05<00:11, 43.12it/s, v_num=0]
Epoch 4:  35%|███▍      | 260/750 [00:06<00:11, 43.29it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00013_13_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 192616.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 192276.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 279821.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:21, 320875.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 393216/26421880 [00:00<00:41, 620688.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 786432/26421880 [00:01<00:21, 1193307.33it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175806.55it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175426.87it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193478.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192894.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280907.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398495.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 809693.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1453101.96it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5514025.52it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3248014.98it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 30411657.74it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
                                                                           
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 22.80it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.51it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.38it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 26.29it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 26.08it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 26.07it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:08, 26.23it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 26.23it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:06<00:07, 26.44it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:07<00:06, 26.56it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:08<00:05, 26.60it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:09<00:05, 24.97it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:15, 22.55it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:13, 24.92it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 25.72it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 25.57it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:03<00:10, 26.52it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:09, 26.71it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:08, 26.23it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:06<00:08, 24.54it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:07<00:08, 23.45it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:08<00:07, 22.44it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 21.68it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 21.24it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 21.26it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:12<00:04, 21.66it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:13<00:03, 21.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:27, 12.89it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:24, 13.79it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:04<00:21, 14.82it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:05<00:19, 15.21it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:06<00:17, 16.04it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:06<00:14, 17.29it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:07<00:12, 18.36it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:08<00:11, 19.14it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:09<00:09, 19.86it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:09<00:08, 20.36it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:10<00:07, 20.82it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:11<00:06, 21.22it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:12<00:05, 21.60it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:12<00:04, 21.89it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:13<00:03, 22.2

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:01<00:20, 17.71it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:16, 20.56it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:02<00:14, 22.33it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:03<00:12, 23.84it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:04<00:11, 24.18it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:04<00:10, 24.88it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:05<00:09, 25.33it/s, v_num=0]
Epoch 3:  43%|████▎     | 160/375 [00:06<00:08, 25.65it/s, v_num=0]
Epoch 3:  48%|████▊     | 180/375 [00:06<00:07, 25.89it/s, v_num=0]
Epoch 3:  53%|█████▎    | 200/375 [00:07<00:06, 26.31it/s, v_num=0]
Trial status: 13 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:56:49. Total running time: 16min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   5%|▌         | 20/375 [00:00<00:15, 22.28it/s, v_num=0]
Epoch 4:  11%|█         | 40/375 [00:01<00:13, 24.75it/s, v_num=0]
Epoch 4:  16%|█▌        | 60/375 [00:02<00:12, 25.11it/s, v_num=0]
Epoch 4:  21%|██▏       | 80/375 [00:03<00:11, 25.25it/s, v_num=0]
Epoch 4:  27%|██▋       | 100/375 [00:03<00:10, 25.85it/s, v_num=0]
Epoch 4:  32%|███▏      | 120/375 [00:04<00:09, 26.10it/s, v_num=0]
Epoch 4:  37%|███▋      | 140/375 [00:05<00:09, 25.88it/s, v_num=0]
Epoch 4:  43%|████▎     | 160/375 [00:06<00:08, 26.15it/s, v_num=0]
Epoch 4:  48%|████▊     | 180/375 [00:06<00:07, 26.19it/s, v_num=0]
Epoch 4:  53%|█████▎    | 200/375 [00:07<00:06, 26.02it/s, v_num=0]
Epoch 4:  59%|█████▊    | 220/375 [00:08<00:06, 24.91it/s, v_num=0]
Epoch 4:  64%|██████▍   | 240/375 [00:10<00:05, 23.60it/s, v_num=0]
Epoch 4:  69%|██████▉   | 260/375 [00:11<00:05, 22.50it/s, v_num=0]
Epoch 4:  75%|███████▍  | 280/375 [00:12<00:04, 21.97it/s, v_num=0]
Epoch 4:  80%|████████  | 300/375 [00:13<00:03, 21.4

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:00<00:16, 21.35it/s, v_num=0]
Epoch 5:  11%|█         | 40/375 [00:01<00:13, 24.47it/s, v_num=0]
Epoch 5:  16%|█▌        | 60/375 [00:02<00:12, 24.78it/s, v_num=0]
Epoch 5:  21%|██▏       | 80/375 [00:03<00:11, 25.65it/s, v_num=0]
Epoch 5:  27%|██▋       | 100/375 [00:03<00:10, 26.13it/s, v_num=0]
Epoch 5:  32%|███▏      | 120/375 [00:04<00:10, 24.74it/s, v_num=0]
Epoch 5:  37%|███▋      | 140/375 [00:06<00:10, 23.21it/s, v_num=0]
Epoch 5:  43%|████▎     | 160/375 [00:07<00:09, 22.36it/s, v_num=0]
Epoch 5:  48%|████▊     | 180/375 [00:08<00:09, 21.56it/s, v_num=0]
Epoch 5:  53%|█████▎    | 200/375 [00:09<00:08, 20.76it/s, v_num=0]
Epoch 5:  59%|█████▊    | 220/375 [00:10<00:07, 20.34it/s, v_num=0]
Epoch 5:  64%|██████▍   | 240/375 [00:11<00:06, 20.74it/s, v_num=0]
Epoch 5:  69%|██████▉   | 260/375 [00:12<00:05, 21.24it/s, v_num=0]
Epoch 5:  75%|███████▍  | 280/375 [00:13<00:04, 21.50it/s, v_num=0]
Epoch 5:  80%|████████  | 300/375 [00:13<00:03, 21.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00014_14_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193495.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193127.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280829.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398479.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 811398.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1452780.95it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172186.53it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171810.15it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191791.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191522.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278638.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 395314.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 804511.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1441399.72it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5472706.80it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3224570.65it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33632830.21it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 63.17it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Trial status: 14 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:57:49. Total running time: 17min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.18it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.49it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.63it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.89it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:06, 13.46it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:09<00:05, 12.53it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:11<00:04, 11.97it/s, v_num=0]
Trial status: 14 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:58:19. Total running time: 18min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_c

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:12, 13.27it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 14.21it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:04<00:08, 14.49it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:06<00:08, 13.18it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:08<00:07, 12.07it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:05, 11.38it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:12<00:04, 11.49it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 11.87it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:14<00:00, 12.20it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:15<00:00, 12.39it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00015_15_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-17/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190609.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190416.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 277038.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 396619.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 797702.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1441055.54it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176348.75it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176007.01it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194537.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194167.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282605.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 400753.86it/s][A[A


Trial status: 15 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:58:49. Total running time: 18min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 815512.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1461916.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 43%|████▎     | 1900544/4422102 [00:01<00:00, 2821931.33it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  85%|████████▌ | 3768320/4422102 [00:01<00:00, 5441895.44it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3268121.19it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 30670848.00it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 33.72it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.63it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.37it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.33it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 42.37it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 42.67it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.78it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.89it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 43.09it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 43.29it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 43.48it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:11, 43.48it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:05<00:11, 43.63it/s, v_num=0]
Ep

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00016_16_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-40-29/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193673.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193390.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281602.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 399375.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 812769.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1456179.23it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24576000/26421880 [00:02<00:00, 16343964.94it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10362231.92it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176838.46it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176479.23it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz
Trial status: 16 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:59:19. Total running time: 19min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftm

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 197075.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 197325.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 287463.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 408749.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 831188.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1489075.48it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 29139375.16it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 68.00it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:14, 24.21it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 25.33it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 26.22it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 26.60it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 27.17it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 27.26it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:08, 27.40it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:05<00:07, 27.13it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:06<00:07, 27.39it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:07<00:06, 27.28it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:08<00:05, 27.33it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:08<00:04, 27.35it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:09<00:04, 26.65it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 16 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 16:59:49. Total running time: 19min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 16 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:00:19. Total running time: 20min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+----------------------------------

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00017_17_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-43-10/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 195614.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 195249.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283926.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402864.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 819652.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1468622.79it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
Trial status: 17 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:01:20. Total running time: 21min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174790.30it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174515.07it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195310.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194989.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 283846.65it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402306.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 819196.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1468171.89it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36535155.65it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 60.82it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.82it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.47it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.48it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.48it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:07<00:06, 13.43it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:09<00:05, 12.28it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:03, 12.05it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:12<00:02, 12.39it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.64it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.83it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%| 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.61it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.09it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:09, 13.54it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:06<00:08, 12.24it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:08<00:07, 11.24it/s, v_num=0]
Trial status: 17 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:01:50. Total running time: 21min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'i

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00018_18_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-44-20/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191791.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191403.40it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 278732.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:22, 319678.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 360448/26421880 [00:00<00:47, 549476.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 720896/26421880 [00:01<00:23, 1078039.50it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  90%|████████▉ | 23756800/26421880 [00:02<00:00, 16049751.07it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10199747.32it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173042.89it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172778.43it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192443.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192154.35it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279537.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396467.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 806735.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1445629.05it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5486095.15it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3233418.75it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 24818709.19it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 83.00it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:22, 33.08it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.20it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 40.03it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 41.43it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 41.86it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 42.36it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.78it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 43.19it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 43.30it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 43.55it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 43.58it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:11, 43.15it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:11, 43.23it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 1:   3%|▎         | 20/750 [00:00<00:32, 22.59it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:28, 25.02it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:02<00:26, 26.13it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:03<00:25, 26.00it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:03<00:24, 26.15it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:04<00:23, 26.48it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:05<00:22, 26.72it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:05<00:22, 26.69it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:06<00:21, 27.10it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:07<00:19, 28.32it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:07<00:18, 29.31it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:07<00:16, 30.23it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:08<00:15, 31.02it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:08<00:14, 31.78it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:22, 32.86it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:18, 38.58it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:16, 41.29it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:01<00:15, 42.04it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:15, 42.23it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:02<00:15, 41.97it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:14, 42.66it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:03<00:13, 43.09it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:04<00:13, 43.16it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:04<00:12, 43.40it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:05<00:12, 43.41it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:05<00:11, 43.58it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:05<00:11, 43.55it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:06<00:10, 43.66it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:06<00:10, 43.6

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   3%|▎         | 20/750 [00:00<00:21, 33.40it/s, v_num=0]
Epoch 3:   5%|▌         | 40/750 [00:01<00:22, 31.52it/s, v_num=0]
Epoch 3:   8%|▊         | 60/750 [00:01<00:22, 30.62it/s, v_num=0]
Trial status: 18 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:03:20. Total running time: 23min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   3%|▎         | 20/750 [00:01<00:37, 19.46it/s, v_num=0]
Epoch 4:   5%|▌         | 40/750 [00:01<00:31, 22.23it/s, v_num=0]
Epoch 4:   8%|▊         | 60/750 [00:02<00:29, 23.71it/s, v_num=0]
Epoch 4:  11%|█         | 80/750 [00:03<00:26, 24.97it/s, v_num=0]
Epoch 4:  13%|█▎        | 100/750 [00:03<00:25, 25.42it/s, v_num=0]
Epoch 4:  16%|█▌        | 120/750 [00:04<00:24, 25.53it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:05<00:23, 25.88it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:05<00:23, 25.85it/s, v_num=0]
Epoch 4:  21%|██▏       | 160/750 [00:05<00:21, 27.34it/s, v_num=0]
Epoch 4:  24%|██▍       | 180/750 [00:06<00:19, 28.60it/s, v_num=0]
Trial status: 18 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:03:50. Total running time: 23min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00019_19_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-45-25/lightning_logs


Trial run_with_tune_62480_00019 started with configuration:
+-----------------------------------------------------------------+
| Trial run_with_tune_62480_00019 config                          |
+-----------------------------------------------------------------+
| batch_size                                                  128 |
| class_key                                                     1 |
| img_key                                                       0 |
| lr                                                         0.01 |
| mlp_af_l0                                                  none |
| mlp_bn_l0                                                 False |
| mlp_config/block_list                      ... 'dropout': 0.0}] |
| mlp_do_l0                                                   0.1 |
| mlp_out_l0                                                   64 |
| regularization_ratio                                        0.5 |
| resnet_config/block_list                   ...adding':

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:13, 197368.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 197017.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 286721.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 406632.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 827177.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1481967.32it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173752.08it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173513.90it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 190877.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 190564.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 277454.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 393084.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 799546.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1433667.30it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5443650.56it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3207479.26it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 40134343.85it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 32.45it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.34it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:14, 23.46it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.85it/s, v_num=0]
Trial status: 19 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:04:20. Total running time: 24min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 's

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.67it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:15, 21.43it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:15, 20.22it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:15, 19.06it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:15, 19.03it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:05<00:15, 18.27it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:06<00:14, 18.21it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:12, 18.17it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 19.16it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:09, 19.83it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:09<00:08, 20.45it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 20.80it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 21.34it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:11<00:05, 21.84it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:12<00:04, 21.99

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:26, 13.16it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:22, 15.18it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:03<00:19, 16.48it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:04<00:16, 18.32it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:05<00:13, 19.66it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:05<00:12, 20.39it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:06<00:11, 21.20it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:07<00:09, 21.81it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:08<00:08, 22.34it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:08<00:07, 22.76it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:09<00:06, 23.23it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:10<00:05, 23.42it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:11<00:04, 23.63it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:11<00:03, 23.90it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:12<00:03, 24.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00020_20_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-45-59/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193671.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193104.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281069.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:21, 322368.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:37, 692966.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 851968/26421880 [00:01<00:19, 1309900.19it/s][A

Trial status: 20 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:05:20. Total running time: 25min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+----------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 25%|██▍       | 6488064/26421880 [00:01<00:02, 9061681.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 36%|███▋      | 9601024/26421880 [00:01<00:01, 11919001.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 48%|████▊     | 12681216/26421880 [00:01<00:00, 13818460.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 60%|█████▉    | 15728640/26421880 [00:02<00:00, 15034428.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 71%|███████▏  | 18841600/26421880 [00:02<00:00, 16018851.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 82%|████████▏ | 21626880/26421880 [00:02<00:00, 16117254.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
100%|██████████| 26421880

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176162.80it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175855.74it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195867.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195423.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284351.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 403427.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|▉         | 425984/4422102 [00:00<00:05, 680492.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1378094.20it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  79%|███████▊  | 3473408/4422102 [00:01<00:00, 5055449.34it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3288745.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 41603616.55it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 35.40it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:15, 10.58it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:03<00:14, 10.04it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:06<00:13,  9.38it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:10, 10.15it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.98it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.57it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:04, 11.97it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.29it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.64it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.84it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%| 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:02<00:21,  7.79it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:04<00:17,  8.40it/s, v_num=0]
Trial status: 20 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:05:50. Total running time: 25min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_k

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:02<00:20,  8.26it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:03<00:14, 10.48it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:05<00:10, 11.79it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:06<00:08, 12.68it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:07<00:06, 13.19it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:08<00:04, 13.76it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:10<00:03, 13.97it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:11<00:01, 14.28it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:12<00:00, 14.36it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:13<00:00, 14.20it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00021_21_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-46-48/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194137.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 193827.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 282033.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400038.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 813956.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1458322.71it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▌| 25264128/26421880 [00:02<00:00, 16810500.95it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10382250.40it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173976.24it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173618.79it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194026.35it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193594.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281755.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399489.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 813233.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1456714.61it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34382606.68it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:20, 35.12it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.99it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 40.83it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 41.84it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 40.29it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:16, 37.18it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:17, 35.75it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:16, 34.73it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:16, 33.55it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:06<00:16, 32.73it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:06<00:16, 31.87it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:07<00:16, 31.60it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:08<00:15, 31.31it/s, v_num=0]
Ep

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00022_22_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-47-32/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190688.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190208.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 276819.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 392700.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 798752.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1432514.39it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▌| 25329664/26421880 [00:02<00:00, 16725078.35it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10192836.15it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173217.95it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172886.77it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193432.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193148.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281129.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398609.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 741741.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██        | 917504/4422102 [00:01<00:02, 1407746.10it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  82%|████████▏ | 3637248/4422102 [00:01<00:00, 5226462.97it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3249695.46it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36597079.65it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 38.40it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 22.95it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.79it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:13, 24.07it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:13, 22.11it/s, v_num=0]
Epoch 0: 100%|██████████| 750/750 [00:36<00:00, 20.33it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process


[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:37<00:00, 19.77it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process


Epoch 0:  27%|██▋       | 100/375 [00:04<00:13, 20.51it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:06<00:13, 19.35it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:07<00:12, 19.11it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:08<00:11, 18.85it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:09<00:10, 19.32it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:08, 19.99it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 20.43it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.92it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:12<00:05, 21.26it/s, v_num=0]
Epoch 0:  75%|███████▍  | 280/375 [00:12<00:04, 21.58it/s, v_num=0]
Epoch 0:  80%|████████  | 300/375 [00:13<00:03, 21.91it/s, v_num=0]
Epoch 0:  85%|████████▌ | 320/375 [00:14<00:02, 22.20it/s, v_num=0]
Epoch 0:  91%|█████████ | 340/375 [00:15<00:01, 22.57it/s, v_num=0]
Epoch 0:  96%|█████████▌| 360/375 [00:15<00:00, 22.87it/s, v_num=0]
Epoch 0: 100%|██████████| 750/750 [00:49<00:00, 

[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/94 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/94 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  21%|██▏       | 20/94 [00:00<00:02, 32.53it/s][A
Trial status: 22 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:07:20. Total running time: 27min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:26, 13.62it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:22, 14.90it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:20, 15.15it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:05<00:20, 14.45it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:05<00:20, 14.45it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:18, 14.83it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:08<00:17, 14.98it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:09<00:15, 15.31it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:10<00:13, 15.42it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:11<00:12, 16.01it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:12<00:10, 16.66it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:12<00:08, 17.38it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:13<00:07, 17.91it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:14<00:06, 18.48it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:14<00:05, 18.99

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00023_23_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=64_2023-09-02_16-48-03/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191678.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191281.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 278409.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400157.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 799880.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1452830.03it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
Trial status: 23 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:07:50. Total running time: 27min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'cl

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176131.97it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175875.23it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195092.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194804.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 283601.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405085.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 818285.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1474244.46it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5581442.69it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3284105.05it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 38557637.49it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 64.92it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:02<00:19,  8.46it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:04<00:16,  8.79it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:06<00:13,  9.38it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:10, 10.41it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:08<00:07, 11.27it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.92it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:03, 12.27it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:12<00:02, 12.69it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:13<00:00, 12.95it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 13.16it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|  

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:02<00:20,  8.03it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:04<00:16,  8.91it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:05<00:12, 10.57it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:06<00:09, 11.57it/s, v_num=0]
Trial status: 23 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:08:20. Total running time: 28min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00024_24_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-49-22/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:12, 198663.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:12, 198177.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 288233.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:19, 330920.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 393216/26421880 [00:00<00:40, 640107.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 786432/26421880 [00:00<00:20, 1229892.61it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173958.15it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173716.24it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193740.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193549.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281656.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399558.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 812915.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1457053.67it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 24018105.66it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 91.11it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:20, 36.00it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.75it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.31it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.07it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 42.57it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 43.46it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:13, 43.71it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 43.51it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 41.01it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:13, 39.30it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:13, 37.98it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:13, 36.94it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:07<00:13, 35.92it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:01<00:38, 19.09it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:31, 22.69it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:02<00:29, 23.51it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:03<00:27, 24.25it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:03<00:25, 25.84it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:04<00:22, 27.90it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:04<00:20, 29.48it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:05<00:19, 30.86it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:05<00:17, 32.11it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:06<00:16, 33.20it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:06<00:15, 33.95it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:06<00:14, 34.59it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:07<00:13, 35.28it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:07<00:13, 35.26it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:07<00:13, 35.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:23, 30.82it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:19, 35.84it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:17, 38.87it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:01<00:16, 40.52it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:15, 41.28it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:02<00:14, 42.22it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:14, 42.64it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:03<00:13, 43.27it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:04<00:13, 43.74it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:04<00:12, 43.79it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:04<00:12, 44.09it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:05<00:11, 44.07it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:05<00:11, 44.04it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:06<00:10, 44.06it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:06<00:10, 44.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   3%|▎         | 20/750 [00:00<00:22, 32.07it/s, v_num=0]
Trial status: 24 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:09:51. Total running time: 29min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 24 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:10:21. Total running time: 30min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+----------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00025_25_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-51-15/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195078.65it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194607.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283073.15it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:20, 324843.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:37, 697382.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 851968/26421880 [00:01<00:19, 1319298.57it/s][A

Trial status: 25 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:11:51. Total running time: 31min 34s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24576000/26421880 [00:02<00:00, 16790566.41it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10377126.05it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174344.75it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174091.23it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195267.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194969.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 283802.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402419.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 749087.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1488180.93it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  86%|████████▌ | 3801088/4422102 [00:01<00:00, 5538946.12it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3283618.41it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 28905323.95it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 49.64it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 22.75it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 25.44it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.59it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.63it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 25.86it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 26.36it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:08, 26.35it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 25.58it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:08, 24.26it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 23.01it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:09<00:06, 22.35it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 21.80it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:12<00:05, 21.63it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:18, 19.71it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 22.40it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:14, 22.24it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:14, 20.83it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:05<00:14, 19.43it/s, v_num=0]
Trial status: 25 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:12:21. Total running time: 32min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:27, 12.86it/s, v_num=0]
Epoch 2:   5%|▌         | 20/375 [00:01<00:27, 12.83it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:23, 13.98it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:03<00:19, 15.78it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:04<00:16, 17.59it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:05<00:14, 18.84it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:06<00:12, 19.70it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:06<00:11, 20.47it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:07<00:10, 21.13it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:08<00:08, 21.68it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:09<00:07, 22.10it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:09<00:06, 22.33it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:10<00:05, 22.57it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:11<00:05, 22.93it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:12<00:04, 23.26

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00026_26_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-51-47/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191971.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191706.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 279091.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400915.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 802754.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1455259.64it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24936448/26421880 [00:02<00:00, 16615104.22it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10264097.30it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175936.97it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175696.26it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 190981.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 190712.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 277574.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 394232.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 801142.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1436623.58it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5450862.98it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3212157.55it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 28114944.00it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 37.60it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:02<00:20,  8.36it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:04<00:17,  8.69it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:06<00:13,  9.62it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:10, 10.64it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:08<00:07, 11.38it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.92it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:03, 12.32it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:12<00:02, 12.68it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:13<00:00, 13.03it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 13.20it/s, v_num=0]
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
Tria

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:02<00:21,  7.75it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:04<00:15,  9.80it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:05<00:11, 11.22it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:06<00:08, 12.12it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:06, 12.82it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:09<00:05, 13.15it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:10<00:03, 13.39it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:11<00:02, 13.63it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:11<00:02, 13.63it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:12<00:00, 13.96it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:13<00:00, 14.12it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:13, 12.92it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 14.44it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:04<00:08, 14.80it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:05<00:07, 14.99it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:06<00:05, 15.13it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:07<00:04, 15.31it/s, v_num=0]
Trial status: 26 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:13:51. Total running time: 33min 34s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'pa

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:  11%|█         | 20/188 [00:01<00:11, 14.15it/s, v_num=0]
Epoch 3:  21%|██▏       | 40/188 [00:02<00:10, 14.69it/s, v_num=0]
Epoch 3:  32%|███▏      | 60/188 [00:03<00:08, 15.07it/s, v_num=0]
Epoch 3:  43%|████▎     | 80/188 [00:05<00:07, 15.28it/s, v_num=0]
Epoch 3:  53%|█████▎    | 100/188 [00:06<00:05, 15.36it/s, v_num=0]
Epoch 3:  64%|██████▍   | 120/188 [00:07<00:04, 15.50it/s, v_num=0]
Epoch 3:  74%|███████▍  | 140/188 [00:09<00:03, 15.06it/s, v_num=0]
Epoch 3:  85%|████████▌ | 160/188 [00:11<00:02, 13.91it/s, v_num=0]
Epoch 3:  96%|█████████▌| 180/188 [00:13<00:00, 13.11it/s, v_num=0]
Epoch 3: 100%|██████████| 188/188 [00:14<00:00, 13.00it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:  11%|█         | 20/188 [00:01<00:13, 12.92it/s, v_num=0]
Trial status: 26 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:14:21. Total running time: 34min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:  11%|█         | 20/188 [00:01<00:12, 13.48it/s, v_num=0]
Epoch 5:  21%|██▏       | 40/188 [00:02<00:10, 14.75it/s, v_num=0]
Epoch 5:  32%|███▏      | 60/188 [00:03<00:08, 15.16it/s, v_num=0]
Epoch 5:  43%|████▎     | 80/188 [00:05<00:07, 14.74it/s, v_num=0]
Epoch 5:  53%|█████▎    | 100/188 [00:07<00:06, 13.24it/s, v_num=0]
Epoch 5:  64%|██████▍   | 120/188 [00:09<00:05, 12.11it/s, v_num=0]
Epoch 5:  74%|███████▍  | 140/188 [00:11<00:03, 12.17it/s, v_num=0]
Trial status: 26 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:14:51. Total running time: 34min 34s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 6:  11%|█         | 20/188 [00:01<00:13, 12.85it/s, v_num=0]
Epoch 6:  21%|██▏       | 40/188 [00:02<00:10, 14.20it/s, v_num=0]
Epoch 6:  32%|███▏      | 60/188 [00:04<00:10, 12.72it/s, v_num=0]
Epoch 6:  43%|████▎     | 80/188 [00:06<00:09, 11.54it/s, v_num=0]
Epoch 6:  53%|█████▎    | 100/188 [00:09<00:08, 10.97it/s, v_num=0]
Epoch 6:  53%|█████▎    | 100/188 [00:09<00:08, 10.96it/s, v_num=0]
Epoch 6:  64%|██████▍   | 120/188 [00:10<00:05, 11.47it/s, v_num=0]
Epoch 6:  74%|███████▍  | 140/188 [00:11<00:04, 11.87it/s, v_num=0]
Epoch 6:  85%|████████▌ | 160/188 [00:13<00:02, 12.19it/s, v_num=0]
Epoch 6:  96%|█████████▌| 180/188 [00:14<00:00, 12.54it/s, v_num=0]
Epoch 6: 100%|██████████| 188/188 [00:14<00:00, 12.71it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 7:  11%|█         | 20/188 [00:01<00:13, 12.68it/s, v_num=0]
Epoch 7:  21%|██▏       | 40/188 [00:03<00:14, 10.55it/s, v_num=0]
Epoch 7:  32%|███▏      | 60/188 [00:06<00:13,  9.68it/s, v_num=0]
Trial status: 26 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:15:21. Total running time: 35min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00027_27_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-52-37/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190458.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 189818.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 276267.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:22, 316739.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 393216/26421880 [00:00<00:42, 612388.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 819200/26421880 [00:01<00:20, 1240956.08it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173797.21it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173547.47it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193440.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193074.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280952.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398560.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 741384.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1472484.25it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  85%|████████▌ | 3768320/4422102 [00:01<00:00, 5436504.35it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3249787.13it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27471090.32it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 58.50it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 34.73it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 39.17it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.12it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.25it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 42.71it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 42.99it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.34it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 41.41it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 41.22it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 41.44it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.23it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:12, 39.58it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:12, 38.29it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00028_28_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-53-20/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Validation DataLoader 0: 100%|██████████| 188/188 [00:04<00:00, 39.15it/s][A
Trial run_with_tune_62480_00027 completed after 1 iterations at 2023-09-02 17:16:05. Total running time: 35min 48s
+----------------------------------------------------+
| Trial run_with_tune_62480_00027 result             |
+----------------------------------------------------+
| time_this_iter_s                           32.5018 |
| time_total_s                               32.5018 |
| training_iteration                               1 |
| ptl/train_accuracy                          0.6875 |
| ptl/train_loss                             0.76223 |
| ptl/val_accuracy                           0.70789 |
| ptl/val_loss                               0.75906 |
+----------------------------------------------------+

Trial run_with_tune_62480_00028 started with configuration:
+--------------------------------------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194674.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194712.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283741.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 403761.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 821234.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1470032.84it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173125.89it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172872.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196659.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196344.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285673.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405892.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 824942.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1479196.92it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5611856.86it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3306007.93it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35748802.97it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 28.57it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 22.17it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.89it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.92it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.66it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 26.08it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:10, 23.76it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:10, 22.19it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:10, 21.19it/s, v_num=0]
Trial status: 28 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:16:21. Total running time: 36min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:17, 19.91it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:18, 17.89it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:18, 17.04it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:17, 16.71it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:05<00:16, 16.87it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.91it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:08<00:13, 17.48it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.28it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 18.95it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:08, 19.51it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 20.09it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.56it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 20.96it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 21.38it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:13<00:03, 21.7

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00029_29_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-55-29/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194452.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194044.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 282248.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400524.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 814120.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1461134.60it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 24969216/26421880 [00:02<00:00, 16885730.06it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10391792.16it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173701.86it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173435.87it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 190885.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 190453.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 277281.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 393228.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 731966.15it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1453511.33it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  85%|████████▌ | 3768320/4422102 [00:01<00:00, 5367000.75it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3207134.28it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 28078383.60it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 44.89it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 1: 100%|██████████| 375/375 [00:29<00:00, 12.63it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process


[2m[36m(run_with_tune pid=1086)[0m Epoch 1: 100%|██████████| 375/375 [00:30<00:00, 12.35it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                         [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process


Epoch 0:  11%|█         | 20/188 [00:01<00:13, 12.21it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.02it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 13.23it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:06<00:08, 12.08it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:08<00:07, 11.23it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.35it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:04, 11.75it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.21it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.52it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.68it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
Epoch 1: 100%|██████████| 375/375 [00:44<00:00,  8.46it/s, v_num=0]
Epoch 1: 100%|██████████| 375/375 [00:44<00:00,  8.46it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:01<00:01, 17.99it/s][A
Epoch 1: 100%|██████████| 375/375 [00:46<00:00,  8.06it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  85%|████████▌ | 40/47 [00:02<00:00, 16.56it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0: 100%|██████████| 47/47 [00:02<00:00, 16.48it/s][A
Epoch 0: 100%|██████████| 188/188 [00:17<00:00, 10.47it/s, v_num=0]
Epoch 1:   0%|          | 0/188 [00:00<?, ?it/s, v_num=0]


[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.25it/s, v_num=0]
Trial status: 29 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:17:21. Total running time: 37min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00030_30_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-57-40/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 191093.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192621.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 279565.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397376.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 808105.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1447972.41it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175824.52it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175539.80it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196493.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196284.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285743.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405416.01it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 824632.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1477864.36it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5608129.30it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3304883.98it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 39764782.67it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 113.48it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:20, 34.83it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:00<00:17, 40.25it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.39it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.93it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.83it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:14, 43.86it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 43.90it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:13, 44.65it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 44.20it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:12, 44.42it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 44.94it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:04<00:11, 44.88it/s, v_num=0]
Trial status: 30 TERMINATED | 1 RUNNING | 16 PENDING
Current t

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:20, 35.41it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:18, 39.34it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:19, 36.00it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:02<00:19, 34.19it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:02<00:19, 33.47it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:03<00:19, 32.59it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:04<00:19, 31.95it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:05<00:18, 31.39it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:05<00:18, 31.02it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:06<00:17, 30.57it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:07<00:17, 30.39it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:07<00:16, 30.38it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:08<00:15, 31.21it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:08<00:14, 31.90it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:09<00:13, 32.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:25, 28.81it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:20, 34.14it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:18, 37.10it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:02<00:17, 38.78it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:16, 38.73it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:03<00:15, 39.55it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:15, 39.97it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:03<00:14, 40.53it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:04<00:13, 41.00it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:04<00:13, 41.22it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:05<00:12, 41.20it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:05<00:12, 41.19it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:05<00:12, 41.18it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:06<00:11, 41.38it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:06<00:11, 41.4

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 3:   3%|▎         | 20/750 [00:00<00:24, 30.23it/s, v_num=0]
Epoch 3:   5%|▌         | 40/750 [00:01<00:20, 35.45it/s, v_num=0]
Epoch 3:   8%|▊         | 60/750 [00:01<00:19, 35.85it/s, v_num=0]
Epoch 3:  11%|█         | 80/750 [00:02<00:20, 32.67it/s, v_num=0]
Epoch 3:  13%|█▎        | 100/750 [00:03<00:20, 31.61it/s, v_num=0]
Epoch 3:  16%|█▌        | 120/750 [00:03<00:20, 30.82it/s, v_num=0]
Epoch 3:  19%|█▊        | 140/750 [00:04<00:20, 29.80it/s, v_num=0]
Epoch 3:  21%|██▏       | 160/750 [00:05<00:20, 28.97it/s, v_num=0]
Epoch 3:  24%|██▍       | 180/750 [00:06<00:19, 28.56it/s, v_num=0]
Epoch 3:  27%|██▋       | 200/750 [00:07<00:19, 28.26it/s, v_num=0]
Epoch 3:  29%|██▉       | 220/750 [00:07<00:19, 27.89it/s, v_num=0]
Epoch 3:  32%|███▏      | 240/750 [00:08<00:18, 27.96it/s, v_num=0]
Epoch 3:  35%|███▍      | 260/750 [00:09<00:17, 28.71it/s, v_num=0]
Epoch 3:  37%|███▋      | 280/750 [00:09<00:16, 29.34it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3: 100%|██████████| 750/750 [00:26<00:00, 28.05it/s, v_num=0]
Epoch 4:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 4:   3%|▎         | 20/750 [00:00<00:24, 29.81it/s, v_num=0]
Epoch 4:   5%|▌         | 40/750 [00:01<00:20, 35.31it/s, v_num=0]
Epoch 4:   8%|▊         | 60/750 [00:01<00:18, 37.20it/s, v_num=0]
Epoch 4:  11%|█         | 80/750 [00:02<00:18, 37.01it/s, v_num=0]
Epoch 4:  13%|█▎        | 100/750 [00:02<00:16, 38.30it/s, v_num=0]
Epoch 4:  16%|█▌        | 120/750 [00:03<00:16, 39.29it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:03<00:15, 39.91it/s, v_num=0]
Epoch 4:  21%|██▏       | 160/750 [00:03<00:14, 40.20it/s, v_num=0]
Epoch 4:  24%|██▍       | 180/750 [00:04<00:14, 40.70it/s, v_num=0]
Epoch 4:  27%|██▋       | 200/750 [00:04<00:13, 40.90it/s, v_num=0]
Epoch 4:  29%|██▉       | 220/750 [00:05<00:12, 41.20it/s, v_num=0]
Epoch 4:  32%|███▏      | 240/750 [00:05<00:12, 41.30it/s, v_num=0]
Epoch 4:  35%|███▍      | 260/750 [00:06<00:11, 41.60it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00031_31_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-58-43/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193566.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193199.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281039.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398315.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 810048.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1453165.27it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▌| 25198592/26421880 [00:02<00:00, 16846165.04it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10319000.11it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174184.31it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173382.43it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192181.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191784.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279942.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398168.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 809512.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1452221.28it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 38216419.45it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 27.31it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.01it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:14, 23.63it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.14it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.84it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 26.08it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 26.35it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:08, 26.61it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 26.47it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:06<00:07, 26.62it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:07<00:06, 26.95it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:08<00:05, 25.85it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:09<00:05, 24.85it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m 
Epoch 2: 100%|██████████| 375/375 [07:48<00:00,  1.25s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 7: 100%|██████████| 188/188 [05:20<00:00,  1.71s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A
Epoch 0: 100%|██████████| 750/750 [05:14<00:00,  2.38it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 1: 100%|██████████| 188/188 [03:35<00:00,  1.14s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 4: 100%|██████████| 750/750 [01:36<00:00,  7.78it/s, v_num=0]




[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A
Trial status: 31 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:21:15. Total running time: 40min 58s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_ke

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00032_32_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_16-59-14/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193406.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192977.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280867.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398460.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 810670.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1452707.38it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177111.70it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176763.72it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 190253.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 189927.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 276451.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 392155.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 798176.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1430188.30it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5424764.62it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3197135.30it/s]


Trial status: 32 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:21:45. Total running time: 41min 28s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27896998.70it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 46.65it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.32it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.37it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 14.20it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.64it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:05, 14.88it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:08<00:04, 13.78it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:10<00:03, 12.78it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.13it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.35it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.52it/s, v_num=0]
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.22it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.15it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.47it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.02it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:06, 12.81it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:09<00:05, 12.07it/s, v_num=0]
Trial status: 32 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:22:15. Total running time: 41min 58s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'pa

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:12, 13.28it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 14.12it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:04<00:09, 12.95it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:06<00:09, 11.85it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:08<00:07, 11.15it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:05, 11.53it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:11<00:04, 11.81it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 12.10it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:14<00:00, 12.46it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:14<00:00, 12.65it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00033_33_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-01-14/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196853.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196195.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285573.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 404979.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:34, 753636.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1364333.70it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174471.54it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174050.36it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz
Trial status: 33 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:22:45. Total running time: 42min 28s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoft

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 198218.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 197782.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 287858.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 408385.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 831016.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1489404.27it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5652970.23it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3329667.56it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 32864957.37it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 131.70it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 34.59it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.89it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 40.34it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 41.72it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 41.70it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 42.30it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.66it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.65it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 42.73it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 42.78it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 42.79it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:11, 42.83it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:11, 42.78it/s, v_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00034_34_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-01-58/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196494.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 195866.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285132.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 404047.40it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 822307.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1474548.08it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24510464/26421880 [00:02<00:00, 16322351.35it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10489027.17it/s]


Trial status: 34 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:23:15. Total running time: 42min 58s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177370.54it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177058.76it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193220.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193254.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281199.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399079.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 812007.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1454777.54it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5522742.91it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3252819.20it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 38695836.90it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 92.29it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 22.32it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.81it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.99it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.32it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 25.34it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 25.56it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 25.44it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 23.94it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:08, 22.94it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:09<00:07, 21.90it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 21.31it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.62it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:12<00:05, 20.91it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.87it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.64it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:14, 21.44it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:14, 20.20it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:05<00:14, 19.44it/s, v_num=0]
Trial status: 34 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:23:45. Total running time: 43min 28s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'i

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00035_35_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-04-09/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 195814.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 195910.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285469.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:19, 328205.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:36, 704932.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 851968/26421880 [00:01<00:19, 1331915.07it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24772608/26421880 [00:02<00:00, 17133524.99it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10511895.64it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172930.73it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172677.93it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193509.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193005.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280444.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398303.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 810788.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1453750.69it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5520218.78it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3250501.33it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35987128.32it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.5 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.3 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 63.25it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:11, 14.42it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.35it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.75it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:08, 13.45it/s, v_num=0]
Trial status: 35 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:24:15. Total running time: 43min 58s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 's

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.67it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:03<00:11, 12.88it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:05<00:11, 11.46it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:07<00:10, 10.30it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:09<00:08, 10.36it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:10<00:06, 10.95it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:12<00:04, 11.47it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:13<00:02, 11.79it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.05it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:15<00:00, 12.16it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00036_36_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-05-18/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194512.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194023.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 282047.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400849.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 814275.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1461626.51it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176404.79it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176101.90it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192791.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192483.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280215.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 397128.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|▉         | 425984/4422102 [00:00<00:05, 670441.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1357599.72it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  79%|███████▊  | 3473408/4422102 [00:01<00:00, 4982811.28it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3240149.02it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33737932.80it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 34.32it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:19, 37.20it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 39.53it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:16, 39.58it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 39.61it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:15, 39.63it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:15, 39.99it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 40.39it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 40.86it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 41.29it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.56it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:12, 42.02it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:11, 42.16it/s, v_num=0]
Ep

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:35, 20.46it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:31, 22.52it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:02<00:29, 23.36it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:03<00:27, 24.29it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:04<00:26, 24.73it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:04<00:25, 25.01it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:05<00:24, 25.20it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:06<00:23, 25.43it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:07<00:22, 25.57it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:07<00:20, 26.66it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:07<00:19, 27.67it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:08<00:17, 28.48it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:08<00:16, 29.27it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:09<00:15, 29.86it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:09<00:14, 30.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:22, 32.79it/s, v_num=0]
Trial status: 36 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:25:46. Total running time: 45min 28s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00037_37_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-06-21/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196914.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196214.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285471.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:20, 327323.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 393216/26421880 [00:00<00:41, 633545.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 786432/26421880 [00:01<00:21, 1217581.24it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175330.47it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175029.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193847.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193477.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281599.75it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399217.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 812358.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1456913.43it/s][A[A
[2

Trial status: 37 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:26:16. Total running time: 45min 58s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+---------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37682856.88it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 39.94it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 22.84it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.95it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.70it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 24.94it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 25.22it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:10, 25.19it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 25.33it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 25.72it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:07, 24.80it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 23.55it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:09<00:06, 22.51it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 21.64it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:12<00:05, 21.09it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:16, 21.40it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.50it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 25.34it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 24.79it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:04<00:12, 22.02it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:05<00:12, 21.21it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:06<00:11, 20.14it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 19.42it/s, v_num=0]
Trial status: 37 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:26:46. Total running time: 46min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'ou

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:25, 13.72it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:22, 14.96it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:03<00:20, 15.19it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:05<00:18, 15.73it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:06<00:17, 15.89it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:07<00:14, 17.08it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:07<00:12, 18.18it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:08<00:11, 18.87it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:09<00:10, 19.42it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:09<00:08, 20.14it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:10<00:07, 20.61it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:11<00:06, 21.00it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:12<00:05, 21.41it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:12<00:04, 21.75it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:13<00:03, 22.0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:01<00:21, 16.57it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:16, 20.51it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:02<00:14, 22.42it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:03<00:12, 23.15it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:04<00:11, 23.81it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:04<00:10, 24.10it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:05<00:09, 24.42it/s, v_num=0]
Epoch 3:  43%|████▎     | 160/375 [00:06<00:08, 24.54it/s, v_num=0]
Epoch 3:  48%|████▊     | 180/375 [00:07<00:07, 24.98it/s, v_num=0]
Epoch 3:  53%|█████▎    | 200/375 [00:07<00:06, 25.01it/s, v_num=0]
Epoch 3:  59%|█████▊    | 220/375 [00:08<00:06, 25.10it/s, v_num=0]
Epoch 3:  64%|██████▍   | 240/375 [00:09<00:05, 25.21it/s, v_num=0]
Epoch 3:  69%|██████▉   | 260/375 [00:10<00:04, 25.36it/s, v_num=0]
Epoch 3:  75%|███████▍  | 280/375 [00:11<00:03, 25.17it/s, v_num=0]
Epoch 3:  80%|████████  | 300/375 [00:12<00:03, 24.3

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   5%|▌         | 20/375 [00:00<00:16, 21.00it/s, v_num=0]
Epoch 4:  11%|█         | 40/375 [00:01<00:14, 23.38it/s, v_num=0]
Epoch 4:  16%|█▌        | 60/375 [00:02<00:12, 24.42it/s, v_num=0]
Epoch 4:  21%|██▏       | 80/375 [00:03<00:11, 25.00it/s, v_num=0]
Epoch 4:  27%|██▋       | 100/375 [00:03<00:10, 25.89it/s, v_num=0]
Epoch 4:  32%|███▏      | 120/375 [00:04<00:09, 25.92it/s, v_num=0]
Epoch 4:  37%|███▋      | 140/375 [00:05<00:09, 25.94it/s, v_num=0]
Trial status: 37 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:27:46. Total running time: 47min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:01<00:18, 19.29it/s, v_num=0]
Epoch 5:  11%|█         | 40/375 [00:01<00:14, 22.56it/s, v_num=0]
Epoch 5:  16%|█▌        | 60/375 [00:02<00:13, 23.99it/s, v_num=0]
Epoch 5:  21%|██▏       | 80/375 [00:03<00:11, 24.62it/s, v_num=0]
Epoch 5:  27%|██▋       | 100/375 [00:04<00:11, 24.43it/s, v_num=0]
Epoch 5:  32%|███▏      | 120/375 [00:04<00:10, 24.55it/s, v_num=0]
Epoch 5:  37%|███▋      | 140/375 [00:06<00:10, 23.04it/s, v_num=0]
Epoch 5:  43%|████▎     | 160/375 [00:07<00:09, 21.65it/s, v_num=0]
Epoch 5:  48%|████▊     | 180/375 [00:08<00:09, 20.92it/s, v_num=0]
Epoch 5:  53%|█████▎    | 200/375 [00:10<00:08, 19.87it/s, v_num=0]
Epoch 5:  59%|█████▊    | 220/375 [00:11<00:08, 18.90it/s, v_num=0]
Epoch 5:  64%|██████▍   | 240/375 [00:13<00:07, 18.40it/s, v_num=0]
Epoch 5:  69%|██████▉   | 260/375 [00:14<00:06, 18.04it/s, v_num=0]
Epoch 5:  75%|███████▍  | 280/375 [00:15<00:05, 17.77it/s, v_num=0]
Trial status: 37 TERMINATED | 1 RUNNING | 16 PENDING

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 6:   5%|▌         | 20/375 [00:01<00:26, 13.25it/s, v_num=0]
Epoch 6:  11%|█         | 40/375 [00:02<00:22, 14.98it/s, v_num=0]
Epoch 6:  16%|█▌        | 60/375 [00:03<00:20, 15.67it/s, v_num=0]
Epoch 6:  21%|██▏       | 80/375 [00:05<00:18, 15.56it/s, v_num=0]
Epoch 6:  27%|██▋       | 100/375 [00:06<00:17, 16.00it/s, v_num=0]
Epoch 6:  32%|███▏      | 120/375 [00:07<00:15, 16.24it/s, v_num=0]
Epoch 6:  37%|███▋      | 140/375 [00:08<00:13, 17.21it/s, v_num=0]
Epoch 6:  43%|████▎     | 160/375 [00:08<00:11, 18.01it/s, v_num=0]
Epoch 6:  48%|████▊     | 180/375 [00:09<00:10, 18.62it/s, v_num=0]
Epoch 6:  53%|█████▎    | 200/375 [00:10<00:09, 19.08it/s, v_num=0]
Epoch 6:  59%|█████▊    | 220/375 [00:11<00:07, 19.59it/s, v_num=0]
Epoch 6:  64%|██████▍   | 240/375 [00:12<00:06, 19.97it/s, v_num=0]
Epoch 6:  69%|██████▉   | 260/375 [00:12<00:05, 20.41it/s, v_num=0]
Epoch 6:  75%|███████▍  | 280/375 [00:13<00:04, 20.74it/s, v_num=0]
Epoch 6:  80%|████████  | 300/375 [00:14<00:03, 21.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
Trial status: 38 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:28:46. Total running time: 48min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00038_38_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-06-55/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191326.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190861.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 277780.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397121.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 801108.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1444619.83it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173878.99it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173591.28it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195978.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195575.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284721.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 403959.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 751670.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:00<00:02, 1376437.30it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  81%|████████  | 3571712/4422102 [00:01<00:00, 5230671.44it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3284626.74it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 29060938.08it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 38.11it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.62it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.13it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:10, 12.09it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:09, 11.21it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.66it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:06, 11.19it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:12<00:04, 11.54it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.00it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.23it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.39it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%| 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.15it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:03<00:13, 10.99it/s, v_num=0]
Trial status: 38 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:29:16. Total running time: 48min 59s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_k

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:02<00:21,  7.71it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:04<00:17,  8.32it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:07<00:14,  8.56it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:08<00:11,  9.62it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:09<00:08, 10.34it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:06, 10.97it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:12<00:04, 11.35it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 11.68it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:15<00:00, 11.93it/s, v_num=0]
Trial status: 38 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:29:46. Total running time: 49min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00039_39_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-07-47/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195163.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 197158.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 286863.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 408232.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 828908.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1487531.18it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172429.00it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172109.45it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194746.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195331.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284204.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402920.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 819924.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1469147.26it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37421623.90it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:22, 32.77it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.61it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.15it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:15, 42.02it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 42.66it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:14, 43.14it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 43.27it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 43.45it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 43.58it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 43.69it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.68it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.66it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:12, 39.67it/s, v_num=0]
Ep

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m 
Epoch 2: 100%|██████████| 188/188 [08:02<00:00,  2.57s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 0: 100%|██████████| 750/750 [07:46<00:00,  1.61it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                          [A
Epoch 1: 100%|██████████| 375/375 [07:05<00:00,  1.13s/it, v_num=0]
Trial status: 39 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:30:46. Total running time: 50min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00040_40_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-08-31/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 192577.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 192230.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 279742.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 396583.65it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:35, 738144.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:19, 1335536.60it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 24969216/26421880 [00:02<00:00, 16815060.20it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10290776.90it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174987.96it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174727.39it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193861.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193418.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281512.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399121.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 812006.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1455116.57it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5523342.24it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3252652.63it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34826253.21it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 40.80it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.56it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.12it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.93it/s, v_num=0]
Trial status: 40 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:31:46. Total running time: 51min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:28, 12.45it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:24, 13.84it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:04<00:22, 14.26it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:05<00:18, 15.75it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:05<00:16, 17.00it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:06<00:14, 17.94it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:12, 18.82it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:10, 19.62it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:08<00:09, 20.27it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:09<00:08, 20.88it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 21.27it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 21.73it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:11<00:05, 21.95it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:12<00:04, 22.16it/s, v_num=0]
Trial status: 40 TERMINATED | 1 RUNNING | 16 PENDING

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00041_41_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-11-48/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:20, 188486.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:20, 188177.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:36, 273823.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 392427.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 788495.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1425889.44it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▌| 25198592/26421880 [00:02<00:00, 16502351.85it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10079625.21it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171100.37it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 170845.35it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196578.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196230.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285765.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 408119.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 823332.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1484718.83it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5619484.44it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3307255.31it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36909875.20it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 61.44it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:02<00:20,  8.17it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:04<00:17,  8.50it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:06<00:14,  8.96it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:08<00:11,  9.80it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.67it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:06, 11.25it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:12<00:04, 11.64it/s, v_num=0]
Trial status: 41 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:32:46. Total running time: 52min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:02<00:22,  7.62it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:04<00:15,  9.61it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:05<00:11, 11.05it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:06<00:09, 11.90it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:08<00:07, 12.50it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:09<00:05, 12.93it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:10<00:03, 13.10it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:11<00:02, 13.48it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:13<00:00, 13.60it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:13<00:00, 13.58it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00042_42_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-12-58/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193109.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192634.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280527.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397904.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 809832.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1450162.70it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24838144/26421880 [00:02<00:00, 16466051.54it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10269215.27it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
Trial status: 42 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:33:16. Total running time: 52min 59s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batc

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177179.39it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176887.48it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192723.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192275.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279837.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396907.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 738601.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1467106.58it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  85%|████████▌ | 3768320/4422102 [00:01<00:00, 5417596.55it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3237476.16it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35927249.57it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 63.59it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 33.90it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 39.04it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:16, 41.17it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 40.89it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:17, 36.47it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:18, 33.85it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:18, 32.68it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:05<00:18, 31.94it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:18, 31.56it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:06<00:17, 31.20it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:07<00:17, 30.57it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:07<00:16, 30.14it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:08<00:16, 30.26it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:23, 30.56it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:19, 36.38it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:17, 38.75it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:02<00:16, 39.93it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:02<00:16, 40.59it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:02<00:15, 40.92it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:03<00:14, 41.24it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:03<00:14, 41.33it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:04<00:13, 41.64it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:04<00:13, 41.77it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:05<00:12, 41.83it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:05<00:12, 41.86it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:06<00:11, 42.02it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:06<00:11, 42.16it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:07<00:10, 42.2

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:23, 31.28it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:19, 37.09it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:18, 37.33it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:02<00:19, 34.24it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:03<00:19, 32.62it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:03<00:20, 31.17it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:04<00:19, 30.59it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:05<00:19, 30.03it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:06<00:19, 29.72it/s, v_num=0]
Trial status: 42 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:34:17. Total running time: 53min 59s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00043_43_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-15-32/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196814.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196618.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 286037.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 405842.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 825586.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1479071.29it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24903680/26421880 [00:02<00:00, 16946023.22it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10512869.89it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176777.35it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176512.44it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194335.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194059.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282474.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 400602.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 815168.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1460580.49it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5543616.17it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3265858.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27789288.28it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 40.13it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:01<00:19, 17.85it/s, v_num=0]
Trial status: 43 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:34:47. Total running time: 54min 29s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:15, 22.49it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.66it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 25.26it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 25.09it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:03<00:10, 25.55it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:09, 25.52it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:09, 25.70it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:06<00:08, 25.99it/s, v_num=0]
Trial status: 43 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:35:17. Total running time: 54min 59s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'ou

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:00<00:17, 20.65it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:01<00:14, 23.60it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:02<00:12, 24.71it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:03<00:11, 24.70it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:03<00:10, 25.54it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:04<00:10, 25.48it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:05<00:09, 24.97it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:06<00:09, 23.52it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:08<00:08, 22.27it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:09<00:08, 21.26it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:10<00:07, 20.98it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:11<00:06, 20.43it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:12<00:05, 20.88it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:13<00:04, 21.08it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:14<00:03, 21.4

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00044_44_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-16-05/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196221.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 195870.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285097.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 404192.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 822264.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1475183.33it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▌| 25362432/26421880 [00:02<00:00, 17044937.27it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10481223.88it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175712.47it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175308.62it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195022.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194472.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282988.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 401074.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 816561.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1463015.53it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34826253.21it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 25.20it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.52it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.37it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 14.19it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.45it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:06, 14.46it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:08<00:04, 14.06it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:10<00:03, 13.07it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:12<00:02, 12.46it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.11it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.30it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%| 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.24it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 13.91it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.55it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.74it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:06, 14.04it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:09<00:05, 12.82it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:11<00:03, 12.07it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:13<00:02, 12.02it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.30it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:15<00:00, 12.49it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:13, 12.89it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 13.92it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:04<00:08, 14.31it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:06<00:08, 12.87it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:08<00:07, 11.64it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:06, 11.11it/s, v_num=0]
Trial status: 44 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:36:47. Total running time: 56min 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'pa

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00045_45_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-16-54/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191934.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 192054.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 279753.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397524.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 808705.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1448725.73it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177755.37it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177342.59it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194738.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195054.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284344.40it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 404149.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 820996.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1472787.58it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 32227279.09it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 59.81it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 33.58it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 37.57it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 39.38it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 40.77it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 40.81it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 41.46it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 41.86it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.14it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 42.31it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:12, 42.61it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 42.56it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:11, 42.77it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:11, 42.82it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00046_46_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-17-38/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 191168.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190927.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 277805.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 394064.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 801884.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1437089.94it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175192.76it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174715.06it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194061.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194318.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282879.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402437.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 818077.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1465415.04it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 30540702.96it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 23.22it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 25.39it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 26.10it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.87it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 26.28it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:09, 26.29it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 25.88it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 26.37it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:06<00:07, 26.30it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:07<00:06, 26.44it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:08<00:06, 25.69it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:09<00:05, 24.71it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:10<00:04, 23.70it/s, v_num=0]
Ep

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.57it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.45it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 24.71it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 25.07it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:03<00:10, 25.29it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:09, 25.58it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:09, 25.12it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:06<00:09, 23.64it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:07<00:08, 22.54it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:09<00:08, 21.64it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 21.18it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.37it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 20.40it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 20.76it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:14<00:03, 21.0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00047_47_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=64_2023-09-02_17-19-52/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196026.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 195917.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285212.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 404814.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:34, 753296.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 917504/26421880 [00:01<00:17, 1429514.92it/s][A

Trial status: 47 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:38:17. Total running time: 58min 0s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+----------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 49%|████▊     | 12845056/26421880 [00:01<00:00, 14003772.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 60%|██████    | 15892480/26421880 [00:02<00:00, 15297479.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 71%|███████   | 18677760/26421880 [00:02<00:00, 15683236.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 82%|████████▏ | 21692416/26421880 [00:02<00:00, 16385349.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
100%|██████████| 26421880/26421880 [00:02<00:00, 10472734.42it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171422.59it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171048.12it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193663.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193533.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282187.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 401333.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 814899.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1462614.69it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5550764.22it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3267713.54it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34658550.55it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 5.3 K 
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 15.1 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 64.84it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.49it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.03it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.68it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.84it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:05, 14.84it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:08<00:04, 14.82it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:09<00:03, 14.55it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:11<00:02, 13.64it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:13<00:00, 12.90it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.83it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|  

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.62it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 13.92it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:09, 14.18it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.27it/s, v_num=0]
Trial status: 47 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:38:47. Total running time: 58min 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm':

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00048_48_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-21-38/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194874.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194291.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 282989.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 401452.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 816749.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1463106.71it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176397.50it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176121.44it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195344.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195958.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285171.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 404013.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 822617.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1473618.09it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5596120.30it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3295540.86it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 23964791.33it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 41.17it/s]
                                                                           
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:35, 20.82it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:30, 23.13it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:02<00:28, 24.31it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:03<00:26, 25.06it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:03<00:25, 25.31it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:04<00:23, 26.90it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:21, 28.31it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:05<00:19, 29.71it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:18, 30.82it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:06<00:17, 31.68it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:06<00:16, 32.52it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:07<00:15, 33.35i

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:26, 27.78it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:21, 33.32it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:18, 36.49it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:02<00:17, 37.68it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:02<00:16, 38.39it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:03<00:16, 38.53it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:03<00:15, 39.33it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:04<00:14, 39.81it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:04<00:14, 40.25it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:04<00:13, 40.72it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:05<00:12, 40.96it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:05<00:12, 41.18it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:06<00:12, 40.48it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:07<00:12, 38.95it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:07<00:11, 38.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:01<00:38, 18.93it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:31, 22.53it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:02<00:28, 24.10it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:03<00:26, 24.84it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:03<00:25, 25.38it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:04<00:24, 25.74it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:05<00:23, 25.91it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:06<00:22, 25.97it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:06<00:21, 26.27it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:07<00:20, 27.33it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:07<00:18, 28.48it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:08<00:17, 29.33it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:08<00:16, 30.21it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:09<00:15, 30.96it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:09<00:14, 31.6

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1: 100%|██████████| 188/188 [07:41<00:00,  2.46s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 2: 100%|██████████| 750/750 [06:34<00:00,  1.90it/s, v_num=0]
Trial status: 48 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:40:47. Total running time: 1hr 0min 30s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'b

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00049_49_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-22-40/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 195894.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 195512.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 284614.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:20, 326498.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:37, 701547.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 819200/26421880 [00:01<00:20, 1259955.29it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 26421880/26421880 [00:02<00:00, 10414009.15it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172990.90it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172565.52it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 190345.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 189938.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 276365.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 393256.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 797300.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1431791.39it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5429238.96it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3198065.28it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 23991418.88it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 56.23it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Trial status: 49 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:42:18. Total running time: 1hr 2min 0s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.82it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.05it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 24.81it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 25.29it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:04<00:12, 22.67it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:05<00:11, 21.51it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:06<00:11, 20.67it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:10, 19.98it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 19.45it/s, v_num=0]
Trial status: 49 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:42:48. Total running time: 1hr 2min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:29, 12.16it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:03<00:25, 13.20it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:04<00:22, 13.90it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:05<00:18, 15.67it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:05<00:16, 17.15it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:06<00:14, 18.16it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:07<00:12, 19.05it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:08<00:10, 19.55it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:08<00:09, 20.03it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:09<00:08, 20.36it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:10<00:07, 20.68it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:11<00:06, 20.97it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:12<00:05, 21.35it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:12<00:04, 21.57it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:13<00:03, 21.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:01<00:18, 19.70it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:15, 21.92it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:02<00:13, 23.19it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:03<00:12, 23.94it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:04<00:11, 24.26it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:04<00:10, 24.56it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:05<00:09, 24.92it/s, v_num=0]
Epoch 3:  43%|████▎     | 160/375 [00:06<00:08, 24.94it/s, v_num=0]
Epoch 3:  48%|████▊     | 180/375 [00:07<00:07, 25.00it/s, v_num=0]
Epoch 3:  53%|█████▎    | 200/375 [00:07<00:06, 25.30it/s, v_num=0]
Epoch 3:  59%|█████▊    | 220/375 [00:09<00:06, 24.14it/s, v_num=0]
Epoch 3:  64%|██████▍   | 240/375 [00:10<00:05, 22.95it/s, v_num=0]
Epoch 3:  69%|██████▉   | 260/375 [00:11<00:05, 22.20it/s, v_num=0]
Epoch 3:  75%|███████▍  | 280/375 [00:12<00:04, 21.60it/s, v_num=0]
Epoch 3:  80%|████████  | 300/375 [00:14<00:03, 21.0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   5%|▌         | 20/375 [00:00<00:17, 20.21it/s, v_num=0]
Epoch 4:  11%|█         | 40/375 [00:01<00:15, 22.27it/s, v_num=0]
Epoch 4:  16%|█▌        | 60/375 [00:02<00:13, 23.56it/s, v_num=0]
Epoch 4:  21%|██▏       | 80/375 [00:03<00:11, 24.67it/s, v_num=0]
Epoch 4:  27%|██▋       | 100/375 [00:04<00:11, 24.46it/s, v_num=0]
Epoch 4:  32%|███▏      | 120/375 [00:05<00:11, 22.26it/s, v_num=0]
Trial status: 49 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:43:48. Total running time: 1hr 3min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:01<00:29, 12.09it/s, v_num=0]
Epoch 5:  11%|█         | 40/375 [00:02<00:24, 13.64it/s, v_num=0]
Epoch 5:  16%|█▌        | 60/375 [00:04<00:22, 13.74it/s, v_num=0]
Epoch 5:  21%|██▏       | 80/375 [00:05<00:20, 14.34it/s, v_num=0]
Epoch 5:  27%|██▋       | 100/375 [00:06<00:17, 15.77it/s, v_num=0]
Epoch 5:  32%|███▏      | 120/375 [00:07<00:15, 16.98it/s, v_num=0]
Epoch 5:  37%|███▋      | 140/375 [00:07<00:13, 17.87it/s, v_num=0]
Epoch 5:  43%|████▎     | 160/375 [00:08<00:11, 18.64it/s, v_num=0]
Epoch 5:  48%|████▊     | 180/375 [00:09<00:10, 19.24it/s, v_num=0]
Epoch 5:  53%|█████▎    | 200/375 [00:10<00:08, 19.73it/s, v_num=0]
Epoch 5:  59%|█████▊    | 220/375 [00:10<00:07, 20.37it/s, v_num=0]
Epoch 5:  64%|██████▍   | 240/375 [00:11<00:06, 20.72it/s, v_num=0]
Epoch 5:  69%|██████▉   | 260/375 [00:12<00:05, 21.15it/s, v_num=0]
Epoch 5:  75%|███████▍  | 280/375 [00:12<00:04, 21.55it/s, v_num=0]
Epoch 5:  80%|████████  | 300/375 [00:13<00:03, 21.7

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 6:   5%|▌         | 20/375 [00:00<00:17, 20.68it/s, v_num=0]
Epoch 6:  11%|█         | 40/375 [00:01<00:14, 23.28it/s, v_num=0]
Epoch 6:  16%|█▌        | 60/375 [00:02<00:12, 24.80it/s, v_num=0]
Epoch 6:  21%|██▏       | 80/375 [00:03<00:11, 25.00it/s, v_num=0]
Epoch 6:  27%|██▋       | 100/375 [00:03<00:10, 25.41it/s, v_num=0]
Epoch 6:  32%|███▏      | 120/375 [00:04<00:09, 25.91it/s, v_num=0]
Epoch 6:  37%|███▋      | 140/375 [00:05<00:09, 25.88it/s, v_num=0]
Epoch 6:  43%|████▎     | 160/375 [00:06<00:08, 26.17it/s, v_num=0]
Epoch 6:  48%|████▊     | 180/375 [00:06<00:07, 26.04it/s, v_num=0]
Epoch 6:  53%|█████▎    | 200/375 [00:07<00:06, 26.32it/s, v_num=0]
Epoch 6:  59%|█████▊    | 220/375 [00:08<00:05, 26.35it/s, v_num=0]
Epoch 6:  64%|██████▍   | 240/375 [00:09<00:05, 26.23it/s, v_num=0]
Epoch 6:  69%|██████▉   | 260/375 [00:10<00:04, 25.25it/s, v_num=0]
Epoch 6:  75%|███████▍  | 280/375 [00:11<00:03, 24.33it/s, v_num=0]
Epoch 6:  80%|████████  | 300/375 [00:12<00:03, 23.7

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00050_50_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-23-11/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:13, 197940.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 197546.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 287537.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 407707.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 829472.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1486258.31it/s][A

Trial status: 50 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:44:48. Total running time: 1hr 4min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 72%|███████▏  | 19136512/26421880 [00:02<00:00, 16366896.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 84%|████████▍ | 22151168/26421880 [00:02<00:00, 16900330.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
100%|██████████| 26421880/26421880 [00:02<00:00, 10579079.10it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172109.45it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171817.30it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192840.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191754.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279143.83it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▍         | 196608/4422102 [00:00<00:13, 320912.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  9%|▉         | 393216/4422102 [00:00<00:06, 621604.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 18%|█▊        | 786432/4422102 [00:01<00:03, 1193679.18it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  70%|███████   | 3112960/4422102 [00:01<00:00, 4446878.75it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3231189.23it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 17096022.95it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 34.63it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:03<00:25,  6.54it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:05<00:20,  7.24it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:07<00:15,  8.39it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:08<00:11,  9.41it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.16it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:11<00:06, 10.82it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:12<00:04, 11.31it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 11.45it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:16<00:00, 11.00it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:17<00:00, 10.96it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|  

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.02it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 13.93it/s, v_num=0]
Trial status: 50 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:45:18. Total running time: 1hr 5min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:12, 12.92it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 13.81it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:04<00:08, 14.27it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:05<00:07, 14.60it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:07<00:06, 13.35it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:09<00:05, 12.38it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:11<00:04, 11.81it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 12.15it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:14<00:00, 12.35it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:14<00:00, 12.59it/s, v_num=0]
Trial status: 50 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:45:48. Total running time: 1hr 5min 31s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config':

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:  11%|█         | 20/188 [00:01<00:13, 12.18it/s, v_num=0]
Epoch 3:  21%|██▏       | 40/188 [00:03<00:11, 13.27it/s, v_num=0]
Epoch 3:  32%|███▏      | 60/188 [00:04<00:10, 12.65it/s, v_num=0]
Epoch 3:  43%|████▎     | 80/188 [00:06<00:09, 11.55it/s, v_num=0]
Epoch 3:  53%|█████▎    | 100/188 [00:09<00:08, 10.91it/s, v_num=0]
Epoch 3:  64%|██████▍   | 120/188 [00:10<00:06, 11.16it/s, v_num=0]
Epoch 3:  74%|███████▍  | 140/188 [00:12<00:04, 11.65it/s, v_num=0]
Epoch 3:  85%|████████▌ | 160/188 [00:13<00:02, 11.99it/s, v_num=0]
Epoch 3:  96%|█████████▌| 180/188 [00:14<00:00, 12.37it/s, v_num=0]
Epoch 3: 100%|██████████| 188/188 [00:15<00:00, 12.50it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:  11%|█         | 20/188 [00:01<00:13, 12.29it/s, v_num=0]
Epoch 4:  21%|██▏       | 40/188 [00:03<00:13, 10.69it/s, v_num=0]
Epoch 4:  32%|███▏      | 60/188 [00:06<00:13,  9.69it/s, v_num=0]
Epoch 4:  43%|████▎     | 80/188 [00:08<00:10,  9.83it/s, v_num=0]
Trial status: 50 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:46:18. Total running time: 1hr 6min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:  11%|█         | 20/188 [00:02<00:22,  7.56it/s, v_num=0]
Epoch 5:  21%|██▏       | 40/188 [00:04<00:18,  8.19it/s, v_num=0]
Epoch 5:  32%|███▏      | 60/188 [00:06<00:13,  9.70it/s, v_num=0]
Epoch 5:  43%|████▎     | 80/188 [00:07<00:10, 10.68it/s, v_num=0]
Epoch 5:  53%|█████▎    | 100/188 [00:08<00:07, 11.27it/s, v_num=0]
Epoch 5:  64%|██████▍   | 120/188 [00:10<00:05, 11.73it/s, v_num=0]
Epoch 5:  74%|███████▍  | 140/188 [00:11<00:03, 12.17it/s, v_num=0]
Epoch 5:  85%|████████▌ | 160/188 [00:12<00:02, 12.38it/s, v_num=0]
Epoch 5:  96%|█████████▌| 180/188 [00:14<00:00, 12.73it/s, v_num=0]
Epoch 5: 100%|██████████| 188/188 [00:14<00:00, 12.85it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00051_51_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-24-00/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 192845.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192383.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 279932.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400687.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 807061.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1457193.19it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▋| 25460736/26421880 [00:02<00:00, 17125254.34it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10306284.65it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174199.76it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173919.29it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192423.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191981.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279456.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 395991.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 737210.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1334431.27it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27969270.72it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 86.09it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 33.86it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.13it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 39.99it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:16, 39.94it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 38.46it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:17, 36.00it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:17, 34.44it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:17, 33.23it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:17, 32.21it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:06<00:17, 31.29it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:07<00:17, 30.62it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:07<00:16, 30.11it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:08<00:16, 29.80it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00052_52_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-24-47/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193164.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192739.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280598.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397807.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:35, 740083.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 917504/26421880 [00:01<00:18, 1404188.93it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24510464/26421880 [00:02<00:00, 16355738.59it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10300426.91it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175056.75it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174744.66it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191756.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191178.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278349.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 394810.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 802954.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1439111.31it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5463349.20it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3217967.41it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 32915056.39it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 30.96it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:01<00:24, 14.45it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:02<00:23, 14.19it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:04<00:21, 14.92it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:05<00:20, 14.64it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:06<00:18, 14.87it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:07<00:16, 15.28it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:08<00:14, 16.10it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:09<00:12, 16.96it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:10<00:11, 17.70it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:09, 18.27it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:11<00:08, 18.81it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:12<00:06, 19.31it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:13<00:05, 19.69it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00053_53_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-26-09/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196732.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196254.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285713.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 405171.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:34, 754197.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 917504/26421880 [00:01<00:17, 1431292.61it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171395.54it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171064.43it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195833.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195444.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284385.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 403517.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 750940.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██        | 917504/4422102 [00:01<00:02, 1425086.91it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  83%|████████▎ | 3670016/4422102 [00:01<00:00, 5353012.78it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3289979.33it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 24179481.51it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 59.20it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.78it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:03<00:11, 13.25it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:05<00:11, 11.38it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:10, 10.57it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.73it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:06, 10.98it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:13<00:04, 10.57it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:15<00:02, 10.39it/s, v_num=0]
Trial status: 53 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:48:18. Total running time: 1hr 8min 1s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_co

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00054_54_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-28-46/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195393.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 195020.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283955.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402844.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:34, 753515.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1493667.37it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 24969216/26421880 [00:02<00:00, 17104180.70it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10456508.00it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176536.86it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176236.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192215.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191775.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279232.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 395975.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 805566.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1443897.66it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5481204.62it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3229126.37it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 38557637.49it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 103.63it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 34.10it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.42it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 39.91it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 39.90it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 40.63it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 41.44it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 41.98it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.08it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.33it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 40.93it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:14, 38.97it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:13, 38.05it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:13, 36.75it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:01<00:37, 19.23it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:31, 22.34it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:02<00:29, 23.51it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:03<00:25, 26.17it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:03<00:23, 27.93it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:04<00:21, 29.66it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:04<00:19, 31.15it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:04<00:18, 32.51it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:05<00:17, 33.13it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:05<00:16, 33.70it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:06<00:15, 34.26it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:06<00:14, 34.89it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:07<00:13, 35.30it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:07<00:13, 35.73it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:08<00:12, 36.2

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:27, 26.19it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:22, 31.96it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:19, 34.60it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:02<00:18, 36.39it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:17, 36.99it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:03<00:16, 37.93it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:15, 38.25it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:04<00:15, 37.59it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:05<00:16, 35.61it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:05<00:16, 34.15it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:06<00:15, 33.23it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:07<00:15, 32.47it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:08<00:15, 31.73it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:08<00:15, 31.15it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:09<00:14, 30.7

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00055_55_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-29-50/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193942.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193210.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281167.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:21, 322608.40it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 393216/26421880 [00:00<00:41, 623734.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 786432/26421880 [00:01<00:21, 1199439.39it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24543232/26421880 [00:02<00:00, 17096344.96it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10350041.90it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176376.39it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176100.90it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191562.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191069.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278288.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 394744.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 803244.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1439431.52it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5465528.40it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3219604.09it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37682856.88it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 39.53it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:17, 20.85it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:14, 23.62it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:13, 24.21it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:12, 23.25it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:13, 21.09it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:06<00:13, 19.57it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:07<00:12, 18.99it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:08<00:11, 18.79it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:09<00:10, 18.40it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:09, 18.77it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:11<00:08, 19.36it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:12<00:06, 19.59it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m 
Epoch 6: 100%|██████████| 375/375 [05:59<00:00,  1.04it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 5: 100%|██████████| 188/188 [04:06<00:00,  1.31s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 0: 100%|██████████| 750/750 [03:48<00:00,  3.28it/s, v_num=0]
Trial status: 55 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:50:49. Total running time: 1hr 10min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00056_56_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-31-35/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195110.49it/s][A[A


Trial status: 56 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:51:49. Total running time: 1hr 11min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+-----------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194688.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283344.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402034.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 816692.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1466465.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  7%|▋         | 1933312/26421880 [00:01<00:08, 2894551.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 15%|█▍        | 3833856/26421880 [00:01<00:

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171970.06it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171577.50it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195373.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195031.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 283881.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402428.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|▉         | 425984/4422102 [00:00<00:05, 678780.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 18%|█▊        | 786432/4422102 [00:01<00:03, 1176393.04it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  68%|██████▊   | 3014656/4422102 [00:01<00:00, 4328530.08it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3279375.02it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27825099.22it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 58.21it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:13, 12.37it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 13.48it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 13.78it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.09it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:07<00:06, 13.59it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:09<00:05, 12.33it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:04, 11.70it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 11.99it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.28it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.46it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%| 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.49it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.26it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:09, 13.65it/s, v_num=0]
Trial status: 56 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:52:19. Total running time: 1hr 12min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activat

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:13, 12.90it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:03<00:13, 10.68it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:06<00:12,  9.85it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:08<00:10,  9.82it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:09<00:08, 10.49it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:06, 11.01it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:12<00:04, 11.48it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 11.86it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:14<00:00, 12.11it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:15<00:00, 12.36it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
Trial status: 56 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:52:49. Tot

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00057_57_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-32-25/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190762.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190202.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 276751.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 392767.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 798410.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1431812.53it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 25067520/26421880 [00:02<00:00, 16761065.00it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10186321.01it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171182.94it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 170939.71it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193375.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193035.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281112.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398544.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 741838.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██        | 917504/4422102 [00:01<00:02, 1407642.66it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  83%|████████▎ | 3670016/4422102 [00:01<00:00, 5287604.52it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3250581.65it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 32765215.47it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 104.02it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:22, 32.95it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 38.31it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 38.91it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 40.27it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 40.99it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 41.24it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 41.59it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 41.96it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 41.79it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 41.80it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.37it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:12, 39.47it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:12, 38.48it/s, v_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00058_58_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-33-12/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 195681.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 195087.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283894.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402752.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 679219.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1376456.49it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24477696/26421880 [00:02<00:00, 16824371.61it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10449171.72it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172784.94it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172532.81it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194812.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194452.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282971.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 401518.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 747043.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██        | 917504/4422102 [00:01<00:02, 1417478.83it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  83%|████████▎ | 3670016/4422102 [00:01<00:00, 5328103.21it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3273102.95it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 31847016.21it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 20.90it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 23.26it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.95it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.76it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.63it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 25.37it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:10, 23.37it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:10, 22.37it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:10, 21.33it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:08<00:09, 20.81it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:09<00:08, 20.15it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 20.37it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.82it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:23, 15.35it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:21, 15.87it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:18, 16.64it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:18, 16.12it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:17, 16.05it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.25it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:08<00:13, 17.27it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.06it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 18.71it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:09, 19.29it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:11<00:07, 19.60it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.08it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 20.56it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 20.93it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:14<00:03, 21.2

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00059_59_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-34-37/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:19, 189497.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:19, 188763.83it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 274775.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:07, 389793.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 793158.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1421536.68it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 170964.27it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 170661.41it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz
Trial status: 59 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:54:19. Total running time: 1hr 14min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'paddi

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196760.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196345.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285762.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405203.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 824627.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1477799.08it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5609381.43it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3305088.33it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33015714.06it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 53.68it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:13, 12.87it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:03<00:11, 13.33it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:05<00:11, 11.34it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:10, 10.77it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:08, 10.66it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:06, 11.21it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:04, 11.70it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.01it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.39it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.53it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|  

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:14, 11.27it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:03<00:14, 10.32it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:06<00:14,  9.12it/s, v_num=0]
Trial status: 59 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:54:49. Total running time: 1hr 14min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activa

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00060_60_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-35-50/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193591.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193057.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280975.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398425.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 672186.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1361051.67it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24608768/26421880 [00:02<00:00, 16951470.07it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10334310.74it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175680.55it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175419.66it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195636.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195176.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284122.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402988.00it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 820122.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1469481.00it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36909875.20it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 61.74it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:21, 34.34it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:18, 37.40it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:17, 40.02it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:01<00:16, 41.46it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:15, 42.00it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 41.92it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 42.27it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:13, 42.39it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 42.58it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 42.11it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 40.86it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:13, 39.20it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:12, 37.76it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:01<00:38, 18.97it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:32, 21.72it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:02<00:29, 23.58it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:03<00:27, 24.49it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:03<00:24, 26.74it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:04<00:21, 28.71it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:04<00:20, 30.36it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:05<00:18, 31.50it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:05<00:17, 32.68it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:05<00:16, 33.42it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:06<00:15, 34.20it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:06<00:14, 34.98it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:07<00:13, 35.51it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:07<00:13, 36.07it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:08<00:12, 36.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:28, 25.92it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:22, 31.65it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:19, 35.08it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:02<00:18, 36.69it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:17, 38.00it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:03<00:16, 38.60it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:15, 39.26it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:04<00:14, 39.74it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:04<00:14, 40.11it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:04<00:13, 40.58it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:05<00:12, 40.78it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:06<00:12, 39.25it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:06<00:12, 37.90it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:07<00:12, 36.66it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:08<00:12, 35.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   3%|▎         | 20/750 [00:01<00:40, 18.22it/s, v_num=0]
Epoch 3:   5%|▌         | 40/750 [00:01<00:33, 20.96it/s, v_num=0]
Epoch 3:   8%|▊         | 60/750 [00:02<00:30, 22.73it/s, v_num=0]
Epoch 3:  11%|█         | 80/750 [00:03<00:28, 23.32it/s, v_num=0]
Epoch 3:  13%|█▎        | 100/750 [00:04<00:26, 24.13it/s, v_num=0]
Epoch 3:  16%|█▌        | 120/750 [00:04<00:24, 26.14it/s, v_num=0]
Epoch 3:  19%|█▊        | 140/750 [00:05<00:21, 27.85it/s, v_num=0]
Epoch 3:  21%|██▏       | 160/750 [00:05<00:20, 29.16it/s, v_num=0]
Epoch 3:  24%|██▍       | 180/750 [00:06<00:19, 29.84it/s, v_num=0]
Epoch 3:  27%|██▋       | 200/750 [00:06<00:17, 30.78it/s, v_num=0]
Epoch 3:  29%|██▉       | 220/750 [00:06<00:16, 31.69it/s, v_num=0]
Epoch 3:  32%|███▏      | 240/750 [00:07<00:15, 32.49it/s, v_num=0]
Epoch 3:  35%|███▍      | 260/750 [00:07<00:14, 33.06it/s, v_num=0]
Epoch 3:  37%|███▋      | 280/750 [00:08<00:13, 33.58it/s, v_num=0]
Epoch 3:  40%|████      | 300/750 [00:08<00:13, 34.0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   3%|▎         | 20/750 [00:00<00:23, 31.13it/s, v_num=0]
Epoch 4:   5%|▌         | 40/750 [00:01<00:19, 36.30it/s, v_num=0]
Epoch 4:   8%|▊         | 60/750 [00:01<00:17, 38.36it/s, v_num=0]
Epoch 4:  11%|█         | 80/750 [00:02<00:16, 39.79it/s, v_num=0]
Epoch 4:  13%|█▎        | 100/750 [00:02<00:15, 40.64it/s, v_num=0]
Epoch 4:  16%|█▌        | 120/750 [00:02<00:15, 41.51it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:03<00:14, 41.36it/s, v_num=0]
Epoch 4:  21%|██▏       | 160/750 [00:03<00:14, 41.89it/s, v_num=0]
Epoch 4:  24%|██▍       | 180/750 [00:04<00:13, 42.14it/s, v_num=0]
Epoch 4:  27%|██▋       | 200/750 [00:04<00:13, 42.14it/s, v_num=0]
Epoch 4:  29%|██▉       | 220/750 [00:05<00:12, 42.11it/s, v_num=0]
Epoch 4:  32%|███▏      | 240/750 [00:05<00:12, 40.36it/s, v_num=0]
Epoch 4:  32%|███▏      | 240/750 [00:05<00:12, 40.35it/s, v_num=0]
Epoch 4:  35%|███▍      | 260/750 [00:06<00:12, 38.87it/s, v_num=0]
Epoch 4:  37%|███▋      | 280/750 [00:07<00:12, 38.1

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   3%|▎         | 20/750 [00:01<00:40, 17.92it/s, v_num=0]
Epoch 5:   5%|▌         | 40/750 [00:01<00:34, 20.78it/s, v_num=0]
Epoch 5:   8%|▊         | 60/750 [00:02<00:30, 22.44it/s, v_num=0]
Epoch 5:  11%|█         | 80/750 [00:03<00:28, 23.25it/s, v_num=0]
Trial status: 60 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:57:19. Total running time: 1hr 17min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_nor

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00061_61_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-36-54/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191629.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191243.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 278360.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 397082.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 802593.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1444452.21it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174935.04it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174469.81it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 198372.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 198022.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 288173.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 408847.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 831731.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1487158.26it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  76%|███████▋  | 3375104/4422102 [00:01<00:00, 4769683.27it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3326907.09it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 18646180.48it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 57.24it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Trial status: 61 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:57:49. Total running time: 1hr 17min 32s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key':

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.75it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.49it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:12, 24.75it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:11, 25.37it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:03<00:10, 25.61it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:09, 25.86it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:09, 25.89it/s, v_num=0]
Trial status: 61 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:58:19. Total running time: 1hr 18min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:00<00:17, 20.69it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:01<00:15, 22.31it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:02<00:13, 23.46it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:03<00:12, 24.08it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:04<00:11, 24.36it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:04<00:10, 24.29it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:06<00:10, 22.73it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:07<00:10, 21.50it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:08<00:09, 20.30it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:10<00:08, 19.90it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:11<00:07, 19.54it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:12<00:06, 19.70it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:12<00:05, 20.09it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:13<00:04, 20.53it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:14<00:03, 20.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:00<00:17, 20.79it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:16, 20.48it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:03<00:16, 18.94it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:04<00:16, 18.23it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:05<00:15, 17.71it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:06<00:14, 17.57it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:08<00:13, 17.25it/s, v_num=0]
Epoch 3:  43%|████▎     | 160/375 [00:09<00:12, 17.67it/s, v_num=0]
Epoch 3:  48%|████▊     | 180/375 [00:09<00:10, 18.34it/s, v_num=0]
Epoch 3:  53%|█████▎    | 200/375 [00:10<00:09, 19.06it/s, v_num=0]
Epoch 3:  59%|█████▊    | 220/375 [00:11<00:07, 19.52it/s, v_num=0]
Epoch 3:  64%|██████▍   | 240/375 [00:12<00:06, 20.00it/s, v_num=0]
Epoch 3:  69%|██████▉   | 260/375 [00:12<00:05, 20.43it/s, v_num=0]
Epoch 3:  75%|███████▍  | 280/375 [00:13<00:04, 20.81it/s, v_num=0]
Epoch 3:  80%|████████  | 300/375 [00:14<00:03, 21.0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   5%|▌         | 20/375 [00:01<00:27, 12.77it/s, v_num=0]
Epoch 4:  11%|█         | 40/375 [00:02<00:23, 14.21it/s, v_num=0]
Trial status: 61 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 17:59:19. Total running time: 1hr 19min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'im

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:01<00:17, 19.88it/s, v_num=0]
Epoch 5:  11%|█         | 40/375 [00:01<00:14, 22.91it/s, v_num=0]
Epoch 5:  16%|█▌        | 60/375 [00:02<00:13, 23.71it/s, v_num=0]
Epoch 5:  21%|██▏       | 80/375 [00:03<00:12, 24.38it/s, v_num=0]
Epoch 5:  27%|██▋       | 100/375 [00:03<00:10, 25.17it/s, v_num=0]
Epoch 5:  32%|███▏      | 120/375 [00:04<00:09, 25.51it/s, v_num=0]
Epoch 5:  37%|███▋      | 140/375 [00:05<00:09, 25.68it/s, v_num=0]
Epoch 5:  43%|████▎     | 160/375 [00:06<00:08, 25.70it/s, v_num=0]
Epoch 5:  48%|████▊     | 180/375 [00:06<00:07, 25.78it/s, v_num=0]
Epoch 5:  53%|█████▎    | 200/375 [00:07<00:06, 25.88it/s, v_num=0]
Epoch 5:  59%|█████▊    | 220/375 [00:08<00:05, 26.13it/s, v_num=0]
Epoch 5:  64%|██████▍   | 240/375 [00:09<00:05, 26.09it/s, v_num=0]
Epoch 5:  64%|██████▍   | 240/375 [00:09<00:05, 26.08it/s, v_num=0]
Epoch 5:  69%|██████▉   | 260/375 [00:10<00:04, 25.56it/s, v_num=0]
Trial status: 61 TERMINATED | 1 RUNNING | 16 PENDING

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 6:   5%|▌         | 20/375 [00:00<00:17, 20.52it/s, v_num=0]
Epoch 6:  11%|█         | 40/375 [00:01<00:14, 23.91it/s, v_num=0]
Epoch 6:  16%|█▌        | 60/375 [00:02<00:12, 25.08it/s, v_num=0]
Epoch 6:  21%|██▏       | 80/375 [00:03<00:11, 25.44it/s, v_num=0]
Epoch 6:  27%|██▋       | 100/375 [00:03<00:10, 26.15it/s, v_num=0]
Epoch 6:  32%|███▏      | 120/375 [00:04<00:09, 26.68it/s, v_num=0]
Epoch 6:  37%|███▋      | 140/375 [00:05<00:08, 26.63it/s, v_num=0]
Epoch 6:  43%|████▎     | 160/375 [00:06<00:08, 26.19it/s, v_num=0]
Epoch 6:  48%|████▊     | 180/375 [00:07<00:07, 25.05it/s, v_num=0]
Epoch 6:  53%|█████▎    | 200/375 [00:08<00:07, 24.12it/s, v_num=0]
Epoch 6:  59%|█████▊    | 220/375 [00:09<00:06, 23.03it/s, v_num=0]
Epoch 6:  64%|██████▍   | 240/375 [00:10<00:06, 22.14it/s, v_num=0]
Epoch 6:  69%|██████▉   | 260/375 [00:11<00:05, 21.70it/s, v_num=0]
Epoch 6:  75%|███████▍  | 280/375 [00:13<00:04, 21.21it/s, v_num=0]
Epoch 6:  80%|████████  | 300/375 [00:13<00:03, 21.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 61 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:00:20. Total running time: 1hr 20min 2s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00062_62_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-37-26/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 192476.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 192162.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 279720.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 396424.65it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 806841.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1447555.09it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▌| 25133056/26421880 [00:02<00:00, 16912424.41it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10293310.80it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz
Trial status: 62 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:01:20. Total running time: 1hr 21min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'ml

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176123.45it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175846.50it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196850.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196445.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285939.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405434.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 825508.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1478718.30it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5611380.80it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3306652.73it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 31293155.06it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 71.25it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.46it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.38it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.30it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.72it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:06, 14.55it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:09<00:05, 13.06it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:03, 12.15it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.09it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.34it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:15<00:00, 12.50it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|  

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.89it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.09it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.58it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:08, 13.48it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:08<00:07, 12.24it/s, v_num=0]
Trial status: 62 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:01:50. Total running time: 1hr 21min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:13, 12.43it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 13.71it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:05<00:11, 11.47it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:07<00:10, 10.54it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:09<00:08, 10.65it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:06, 11.12it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:12<00:04, 11.62it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 11.97it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:14<00:00, 12.26it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:15<00:00, 12.41it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00063_63_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-38-15/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:12, 199663.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:12, 198949.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:30, 289461.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:03, 410887.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 835047.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:16, 1498422.11it/s][A

Trial status: 63 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:02:20. Total running time: 1hr 22min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 38%|███▊      | 10027008/26421880 [00:01<00:01, 12558726.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 50%|████▉     | 13139968/26421880 [00:01<00:00, 14455321.67it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 61%|██████▏   | 16220160/26421880 [00:01<00:00, 15772027.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 73%|███████▎  | 19234816/26421880 [00:02<00:00, 16527918.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 84%|████████▍ | 22249472/26421880 [00:02<00:00, 17052919.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
100%|██████████| 26421880/26421880 [00:02<00:00, 10651576.35it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171554.91it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171302.33it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191971.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191540.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278991.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 395832.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 805475.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1443785.83it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5479141.39it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3227192.48it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 22398627.59it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 47.75it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:22, 32.24it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:19, 36.77it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:18, 38.00it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:17, 38.94it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 39.71it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 40.05it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 40.70it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 40.77it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 41.18it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 40.92it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.23it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:12, 40.94it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:12, 40.05it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00064_64_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-39-00/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:13, 198358.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 197730.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 287673.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:03, 411231.75it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 828100.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1495946.34it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175054.77it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174794.01it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193277.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192914.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280772.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398194.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 810425.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1452488.75it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5512220.67it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3247608.35it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33321415.11it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 48.87it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.54it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 25.09it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.17it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.30it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:03<00:10, 25.57it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:10, 24.70it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:10, 22.82it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:09, 21.63it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:08<00:09, 20.68it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:09<00:08, 20.18it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:11<00:07, 19.90it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.28it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 64 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:03:20. Total running time: 1hr 23min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00065_65_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-42-09/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:19, 189439.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 189766.85it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 276363.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 393006.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 799081.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1431104.17it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 25001984/26421880 [00:02<00:00, 16456615.76it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10179922.67it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176701.40it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176397.75it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195785.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195321.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284230.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 403181.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 749709.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1358204.96it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  81%|████████  | 3571712/4422102 [00:01<00:00, 5195050.71it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3287009.28it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 28561212.95it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 38.08it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Trial status: 65 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:03:50. Total running time: 1hr 23min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fu

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:02<00:17,  9.86it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:04<00:15,  9.78it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:06<00:13,  9.58it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:07<00:10, 10.06it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:09<00:08, 10.90it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:10<00:05, 11.48it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:11<00:04, 11.78it/s, v_num=0]
Trial status: 65 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:04:20. Total running time: 1hr 24min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00066_66_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-44-45/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:14, 196696.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196326.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285613.89it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 404521.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 824556.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1478978.35it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24903680/26421880 [00:02<00:00, 17189207.93it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10513737.60it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174729.37it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174465.14it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 190230.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 189791.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 276217.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 391791.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 797111.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1428895.45it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33321415.11it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 38.35it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:22, 33.04it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:19, 36.26it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:18, 37.77it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:17, 38.91it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 39.85it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:16, 38.88it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:15, 38.73it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:15, 37.20it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:15, 36.11it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:15, 36.06it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:15, 35.06it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:06<00:15, 34.18it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:01<00:38, 18.93it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:27, 26.12it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:22, 30.07it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:02<00:20, 32.79it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:02<00:18, 34.68it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:03<00:17, 35.33it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:03<00:17, 35.71it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:04<00:16, 36.44it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:04<00:15, 37.05it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:05<00:14, 37.68it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:05<00:13, 38.14it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:06<00:13, 38.51it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:06<00:12, 38.95it/s, v_num=0]
Epoch 1:  37%|███▋      | 280/750 [00:07<00:12, 39.15it/s, v_num=0]
Epoch 1:  40%|████      | 300/750 [00:07<00:11, 39.3

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   3%|▎         | 20/750 [00:00<00:23, 30.61it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:19, 37.22it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:17, 38.42it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:02<00:16, 39.72it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:16, 40.02it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:02<00:15, 40.71it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:14, 41.03it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:03<00:14, 40.45it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:04<00:14, 38.07it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:05<00:15, 36.39it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:06<00:15, 35.15it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:07<00:14, 34.14it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:07<00:14, 33.46it/s, v_num=0]
Epoch 2:  37%|███▋      | 280/750 [00:08<00:14, 32.63it/s, v_num=0]
Epoch 2:  40%|████      | 300/750 [00:09<00:14, 31.9

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00067_67_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-46-48/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195120.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194799.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283467.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 402089.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 818127.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1466435.38it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171346.19it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171032.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196615.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196340.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285918.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405439.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 824840.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1478365.64it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5612739.52it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3305077.14it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36597079.65it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 56.02it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 23.39it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 25.05it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:11, 26.87it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 26.17it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 23.25it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:11, 21.98it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:11, 20.70it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:10, 20.19it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:09<00:09, 19.54it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:08, 19.50it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 20.06it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.47it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:12<00:05, 20.96it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:24, 14.57it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:20, 16.08it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:19, 16.11it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:18, 16.26it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:16, 16.28it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.21it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:08<00:13, 17.23it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.20it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 18.77it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:08, 19.45it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:11<00:07, 19.86it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.36it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 20.77it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 21.25it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:13<00:03, 21.4

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:27, 12.92it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:22, 14.88it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:03<00:17, 17.57it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:04<00:15, 19.46it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:04<00:13, 20.52it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:05<00:11, 21.54it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:06<00:10, 22.46it/s, v_num=0]
Trial status: 67 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:06:50. Total running time: 1hr 26min 33s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00068_68_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-47-23/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:13, 197177.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 196807.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 286501.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 406319.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 826834.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1481417.46it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▌| 25165824/26421880 [00:02<00:00, 17243961.83it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10544626.32it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177467.42it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177203.99it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196747.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196609.64it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 286122.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405581.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 825284.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1479072.12it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5615294.18it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3308005.61it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 30156811.44it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 39.89it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:02<00:17,  9.48it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:04<00:15,  9.58it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:06<00:13,  9.42it/s, v_num=0]
Trial status: 68 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:07:20. Total running time: 1hr 27min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00069_69_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-47-55/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194422.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 193985.01it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 282414.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400543.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 814858.85it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1460815.44it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▌| 25165824/26421880 [00:02<00:00, 16991725.09it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10388689.48it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175723.44it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175446.01it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196584.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196150.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285426.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 405062.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 824436.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1477025.94it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 31941238.15it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 54.02it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:22, 32.89it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:19, 35.89it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:18, 38.21it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:16, 39.46it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 39.71it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 40.39it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 40.91it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 41.10it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:14, 38.64it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:14, 37.01it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:14, 36.98it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:06<00:14, 36.10it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:14, 35.20it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00070_70_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-48-25/lightning_logs


Trial run_with_tune_62480_00070 started with configuration:
+-----------------------------------------------------------------+
| Trial run_with_tune_62480_00070 config                          |
+-----------------------------------------------------------------+
| batch_size                                                  128 |
| class_key                                                     1 |
| img_key                                                       0 |
| lr                                                          0.1 |
| mlp_af_l0                                                  none |
| mlp_bn_l0                                                 False |
| mlp_config/block_list                      ... 'dropout': 0.0}] |
| mlp_do_l0                                                   0.1 |
| mlp_out_l0                                                  128 |
| regularization_ratio                                        0.5 |
| resnet_config/block_list                   ...adding':

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 192479.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 192217.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 279268.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 396652.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 807022.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1445647.38it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176826.09it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176540.63it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193878.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193493.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281633.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399652.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 813343.07it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1457005.91it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 28599042.37it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 38.56it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.08it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.45it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 25.53it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:11, 25.91it/s, v_num=0]
Trial status: 70 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:08:21. Total running time: 1hr 28min 3s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channel

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:20, 17.35it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:20, 16.68it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:18, 16.86it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:17, 16.48it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:16, 16.61it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.71it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:08<00:14, 16.62it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:09<00:12, 17.46it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 18.26it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:09, 18.91it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:11<00:07, 19.42it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:12<00:06, 19.91it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 20.44it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 20.77it/s, v_num=0]
Trial status: 70 TERMINATED | 1 RUNNING | 16 PENDING

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00071_71_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.1000,mlp_out_l0=128_2023-09-02_17-49-51/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195424.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196079.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 285399.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 406681.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 825166.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1481700.80it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172704.67it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172440.77it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195617.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195301.13it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284270.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 410404.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 816761.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1488200.90it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5612119.44it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3285292.31it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27471090.32it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 56.46it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:13, 12.81it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.22it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.27it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:06<00:08, 13.09it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:08<00:07, 12.23it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.40it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:12<00:04, 11.27it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 11.67it/s, v_num=0]
Trial status: 71 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:09:21. Total running time: 1hr 29min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_c

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.56it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 13.64it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:09, 12.98it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:06<00:09, 11.70it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:08<00:07, 11.15it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:11<00:06, 10.75it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:12<00:04, 11.09it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:13<00:02, 11.47it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:15<00:00, 11.80it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:15<00:00, 12.01it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00072_72_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_17-51-48/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 192157.54it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191767.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 279063.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 395924.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 805112.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1443476.19it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177794.43it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177351.99it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192670.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192765.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281069.88it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399676.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 811573.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1456717.74it/s][A[A


Trial status: 72 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:09:51. Total running time: 1hr 29min 34s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+-----------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  44%|████▎     | 1933312/4422102 [00:01<00:00, 2872568.97it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5527386.66it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3252810.07it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 24233756.44it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 120.01it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:23, 30.57it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:19, 35.90it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:18, 37.88it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:16, 39.43it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 40.48it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:02<00:15, 40.99it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:14, 41.29it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 41.07it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:13, 41.44it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 41.42it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.46it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:12, 41.32it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:11, 41.42it/s, v_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 72 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:10:21. Total running time: 1hr 30min 4s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00073_73_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_17-52-51/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190218.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 189920.75it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 276314.21it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 391855.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 796921.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1428318.70it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 25100288/26421880 [00:02<00:00, 16321762.07it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10167232.16it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173789.89it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173523.63it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196839.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196648.75it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 286225.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 406309.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 826412.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1481217.98it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5616380.76it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3304965.83it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 27611607.41it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 83.01it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:15, 22.29it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:14, 22.91it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.63it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:12, 23.73it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:12, 21.59it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:12, 20.36it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:07<00:12, 19.49it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:08<00:11, 19.22it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:09<00:10, 19.19it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:10<00:08, 19.64it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:10<00:07, 20.12it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:11<00:06, 20.56it/s, v_num=0]
Trial status: 73 TERMINATED | 1 RUNNING | 16 PENDING
Current t

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:27, 12.80it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:23, 14.25it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:04<00:21, 14.93it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:05<00:18, 15.85it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:05<00:15, 17.24it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:06<00:13, 18.31it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:12, 19.06it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:10, 19.92it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:08<00:09, 20.40it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:09<00:08, 20.88it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 21.41it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 21.79it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:11<00:05, 22.07it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:12<00:04, 22.29it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:13<00:03, 22.5

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:00<00:17, 20.24it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:01<00:14, 22.95it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:02<00:13, 24.13it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:03<00:11, 24.93it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:04<00:11, 24.92it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:04<00:10, 25.17it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:05<00:09, 25.55it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:06<00:08, 25.67it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:06<00:07, 25.79it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:07<00:06, 26.03it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:08<00:05, 26.10it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:09<00:05, 25.35it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:10<00:04, 24.28it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:11<00:04, 23.57it/s, v_num=0]
Epoch 2:  80%|████████  | 300/375 [00:13<00:03, 22.6

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:01<00:19, 18.48it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:15, 21.75it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:02<00:13, 23.47it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:03<00:12, 24.02it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:04<00:11, 23.94it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:05<00:11, 22.17it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:06<00:11, 20.66it/s, v_num=0]
Trial status: 73 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:13:52. Total running time: 1hr 33min 34s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   5%|▌         | 20/375 [00:01<00:30, 11.79it/s, v_num=0]
Epoch 4:  11%|█         | 40/375 [00:02<00:25, 13.35it/s, v_num=0]
Epoch 4:  16%|█▌        | 60/375 [00:04<00:22, 14.15it/s, v_num=0]
Epoch 4:  21%|██▏       | 80/375 [00:05<00:20, 14.67it/s, v_num=0]
Epoch 4:  27%|██▋       | 100/375 [00:06<00:17, 15.61it/s, v_num=0]
Epoch 4:  32%|███▏      | 120/375 [00:07<00:15, 16.73it/s, v_num=0]
Epoch 4:  37%|███▋      | 140/375 [00:07<00:13, 17.65it/s, v_num=0]
Epoch 4:  43%|████▎     | 160/375 [00:08<00:11, 18.48it/s, v_num=0]
Epoch 4:  48%|████▊     | 180/375 [00:09<00:10, 18.99it/s, v_num=0]
Epoch 4:  53%|█████▎    | 200/375 [00:10<00:08, 19.47it/s, v_num=0]
Epoch 4:  59%|█████▊    | 220/375 [00:11<00:07, 19.92it/s, v_num=0]
Epoch 4:  64%|██████▍   | 240/375 [00:11<00:06, 20.32it/s, v_num=0]
Epoch 4:  69%|██████▉   | 260/375 [00:12<00:05, 20.57it/s, v_num=0]
Epoch 4:  75%|███████▍  | 280/375 [00:13<00:04, 20.96it/s, v_num=0]
Epoch 4:  80%|████████  | 300/375 [00:14<00:03, 21.2

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:00<00:16, 21.18it/s, v_num=0]
Epoch 5:  11%|█         | 40/375 [00:01<00:14, 22.57it/s, v_num=0]
Epoch 5:  16%|█▌        | 60/375 [00:02<00:13, 23.78it/s, v_num=0]
Epoch 5:  21%|██▏       | 80/375 [00:03<00:12, 24.43it/s, v_num=0]
Epoch 5:  27%|██▋       | 100/375 [00:04<00:11, 24.55it/s, v_num=0]
Epoch 5:  32%|███▏      | 120/375 [00:04<00:10, 25.15it/s, v_num=0]
Epoch 5:  37%|███▋      | 140/375 [00:05<00:09, 25.17it/s, v_num=0]
Epoch 5:  43%|████▎     | 160/375 [00:06<00:08, 25.47it/s, v_num=0]
Epoch 5:  48%|████▊     | 180/375 [00:07<00:07, 25.37it/s, v_num=0]
Epoch 5:  53%|█████▎    | 200/375 [00:07<00:06, 25.49it/s, v_num=0]
Epoch 5:  59%|█████▊    | 220/375 [00:08<00:06, 25.47it/s, v_num=0]
Epoch 5:  64%|██████▍   | 240/375 [00:09<00:05, 25.46it/s, v_num=0]
Epoch 5:  69%|██████▉   | 260/375 [00:10<00:04, 24.49it/s, v_num=0]
Epoch 5:  75%|███████▍  | 280/375 [00:11<00:04, 23.54it/s, v_num=0]
Epoch 5:  80%|████████  | 300/375 [00:13<00:03, 22.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 6:   5%|▌         | 20/375 [00:01<00:18, 19.71it/s, v_num=0]
Epoch 6:  11%|█         | 40/375 [00:01<00:14, 23.07it/s, v_num=0]
Epoch 6:  16%|█▌        | 60/375 [00:02<00:13, 24.04it/s, v_num=0]
Epoch 6:  21%|██▏       | 80/375 [00:03<00:12, 24.49it/s, v_num=0]
Epoch 6:  27%|██▋       | 100/375 [00:04<00:11, 24.92it/s, v_num=0]
Trial status: 73 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:14:52. Total running time: 1hr 34min 35s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00074_74_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_17-53-24/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190932.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190589.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 277553.28it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:21, 321068.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 682835.05it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 851968/26421880 [00:01<00:19, 1300773.05it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175496.01it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175127.83it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191147.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 190918.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278036.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 394470.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 734147.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1457896.41it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  85%|████████▌ | 3768320/4422102 [00:01<00:00, 5382730.70it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3216197.99it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 19313306.79it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 25.05it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.65it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.39it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.31it/s, v_num=0]
Trial status: 74 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:15:22. Total running time: 1hr 35min 5s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.92it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.01it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.27it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 13.59it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:07, 12.53it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:10<00:05, 11.82it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:11<00:04, 11.67it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:13<00:02, 12.07it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.36it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:15<00:00, 12.52it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:01<00:13, 12.73it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:02<00:10, 13.49it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:05<00:10, 11.85it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:07<00:09, 11.07it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:09<00:08, 10.68it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:10<00:06, 11.17it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:12<00:04, 11.62it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:13<00:02, 12.01it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:14<00:00, 12.23it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:15<00:00, 12.41it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:  11%|█         | 20/188 [00:01<00:15, 10.97it/s, v_num=0]
Epoch 3:  11%|█         | 20/188 [00:01<00:15, 10.92it/s, v_num=0]
Epoch 3:  21%|██▏       | 40/188 [00:03<00:14, 10.12it/s, v_num=0]
Epoch 3:  32%|███▏      | 60/188 [00:06<00:13,  9.79it/s, v_num=0]
Epoch 3:  43%|████▎     | 80/188 [00:07<00:10, 10.04it/s, v_num=0]
Epoch 3:  53%|█████▎    | 100/188 [00:09<00:08, 10.78it/s, v_num=0]
Epoch 3:  64%|██████▍   | 120/188 [00:10<00:06, 11.31it/s, v_num=0]
Trial status: 74 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:16:22. Total running time: 1hr 36min 5s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'i

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:  11%|█         | 20/188 [00:02<00:22,  7.52it/s, v_num=0]
Epoch 4:  21%|██▏       | 40/188 [00:04<00:17,  8.46it/s, v_num=0]
Epoch 4:  32%|███▏      | 60/188 [00:06<00:12,  9.86it/s, v_num=0]
Epoch 4:  43%|████▎     | 80/188 [00:07<00:10, 10.79it/s, v_num=0]
Epoch 4:  53%|█████▎    | 100/188 [00:08<00:07, 11.40it/s, v_num=0]
Epoch 4:  64%|██████▍   | 120/188 [00:10<00:05, 11.89it/s, v_num=0]
Epoch 4:  74%|███████▍  | 140/188 [00:12<00:04, 11.60it/s, v_num=0]
Epoch 4:  85%|████████▌ | 160/188 [00:14<00:02, 11.29it/s, v_num=0]
Epoch 4:  96%|█████████▌| 180/188 [00:16<00:00, 10.66it/s, v_num=0]
Epoch 4: 100%|██████████| 188/188 [00:17<00:00, 10.58it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:  11%|█         | 20/188 [00:01<00:14, 11.98it/s, v_num=0]
Epoch 5:  21%|██▏       | 40/188 [00:02<00:10, 13.48it/s, v_num=0]
Epoch 5:  32%|███▏      | 60/188 [00:04<00:09, 14.14it/s, v_num=0]
Epoch 5:  43%|████▎     | 80/188 [00:05<00:07, 14.64it/s, v_num=0]
Epoch 5:  53%|█████▎    | 100/188 [00:07<00:06, 14.26it/s, v_num=0]
Epoch 5:  64%|██████▍   | 120/188 [00:08<00:04, 14.41it/s, v_num=0]
Epoch 5:  74%|███████▍  | 140/188 [00:09<00:03, 14.16it/s, v_num=0]
Epoch 5:  85%|████████▌ | 160/188 [00:12<00:02, 13.22it/s, v_num=0]
Epoch 5:  96%|█████████▌| 180/188 [00:14<00:00, 12.48it/s, v_num=0]
Epoch 5: 100%|██████████| 188/188 [00:15<00:00, 12.42it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:01<00:01, 15.88it/s][A
[2m[36m(run_w

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00075_75_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_17-54-14/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194341.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 193986.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 282363.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400147.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 675630.50it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1368448.62it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177557.53it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177242.04it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195418.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195093.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284049.20it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402712.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 749211.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1356498.96it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  81%|████████  | 3571712/4422102 [00:01<00:00, 5189830.14it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3282753.64it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 30540702.96it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 18.86it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:01<00:36, 19.77it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:32, 22.16it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:02<00:29, 23.27it/s, v_num=0]
Trial status: 75 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:17:22. Total running time: 1hr 37min 5s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00076_76_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_17-55-02/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193952.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193532.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281394.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 399007.85it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:34, 742734.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1474991.37it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175169.70it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174873.51it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 191780.01it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191245.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278246.04it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 394738.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 803655.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1440240.91it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
Trial status: 76 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:17:52. Total running time: 1hr 37min 35s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5466540.96it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3218850.90it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33424577.39it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 46.67it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:01<00:22, 15.74it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:02<00:16, 19.87it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:14, 21.20it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:13, 22.29it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 22.97it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:05<00:10, 23.56it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 23.95it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 24.28it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:08, 24.36it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 24.54it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:08<00:06, 24.87it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:09<00:05, 25.05it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:10<00:04, 25.15it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:17, 19.74it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 23.25it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:13, 23.83it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:12, 24.55it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:03<00:10, 25.09it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:10, 24.90it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:09, 25.18it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:06<00:08, 25.47it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:07<00:07, 25.06it/s, v_num=0]
Trial status: 76 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:18:22. Total running time: 1hr 38min 5s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00077_77_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_17-57-40/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193278.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192772.85it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280436.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398106.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 810055.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1452419.24it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 26421880/26421880 [00:02<00:00, 10329665.89it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175829.52it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175447.75it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 190680.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 190334.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 276753.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 392873.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 799191.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1432781.67it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5436410.31it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3201795.60it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34770172.29it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 26.59it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.31it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.26it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.24it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.47it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.54it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:06, 14.60it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:08<00:04, 14.75it/s, v_num=0]
Trial status: 77 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:18:52. Total running time: 1hr 38min 35s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_c

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.09it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.34it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.68it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.65it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:06<00:05, 14.68it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:08<00:04, 14.12it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:10<00:03, 13.20it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:12<00:02, 12.46it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.42it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:14<00:00, 12.56it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00078_78_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-01-15/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191975.83it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:17, 191551.83it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 278752.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 395614.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 804744.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1441367.57it/s][A

Trial status: 78 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:19:22. Total running time: 1hr 39min 5s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 72%|███████▏  | 18907136/26421880 [00:02<00:00, 15509525.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 83%|████████▎ | 21987328/26421880 [00:02<00:00, 16255757.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 95%|█████████▍| 25001984/26421880 [00:02<00:00, 16651165.69it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 26421880/26421880 [00:02<00:00, 10254890.97it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173176.51it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172799.41it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 190814.82it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 190540.63it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 277024.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 392846.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 799926.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1434303.88it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5442440.53it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3205696.41it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 28410890.78it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 45.42it/s]
                                                                           
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:35, 20.59it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:30, 23.13it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:02<00:29, 23.56it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:03<00:26, 25.06it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:03<00:23, 27.38it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:04<00:21, 29.28it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:19, 30.84it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:05<00:18, 31.80it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:05<00:17, 32.88it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:16, 33.96it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:06<00:15, 34.57it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:06<00:14, 35.39i

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00079_79_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-02-18/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193595.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193170.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281439.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 399187.72it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 812423.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1455951.08it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174636.69it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174368.08it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195672.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195180.32it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 284074.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402924.58it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 819066.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1470610.07it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 24018105.66it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 30.02it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:01<00:28, 12.44it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:02<00:23, 14.08it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:03<00:19, 15.88it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:04<00:16, 17.47it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:05<00:14, 18.97it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:06<00:12, 19.75it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:11, 20.64it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:10, 21.30it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:08<00:08, 21.79it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 22.30it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:09<00:06, 22.56it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:10<00:05, 22.95it/s, v_num=0]
Epoch 1: 100%|██████████| 750/750 [08:09<00:00,  1.53it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m 
Epoch 5: 100%|██████████| 188/188 [03:42<00:00,  1.19s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A
Trial status: 79 TERMINATED | 1 RUNNING | 16 PENDING
Current time: 2023-09-02 18:20:52. Total running time: 1hr 40min 35s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'o

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00080_80_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-02-51/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194964.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194378.66it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 282934.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 401249.46it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 676824.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1370840.58it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 170525.76it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 170233.11it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192476.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191997.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279357.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396079.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 737114.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1334367.56it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
Trial status: 80 TERMINATED | 1 RUNNING | 15 PENDING
Current time: 2023-09-02 18:21:53. Total running time: 1hr 41min 35s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activa

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  81%|████████  | 3571712/4422102 [00:01<00:00, 5124541.74it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3231407.09it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33167860.20it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 22.88it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:11, 14.06it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.33it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:08, 14.50it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 13.91it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:07<00:06, 12.62it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.75it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.75it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:04, 11.83it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:13<00:02, 12.12it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.44it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.56it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00,

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:12, 13.57it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.24it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:10, 12.45it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:07<00:09, 11.28it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:09<00:08, 10.88it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:10<00:05, 11.36it/s, v_num=0]
Trial status: 80 TERMINATED | 1 RUNNING | 15 PENDING
Current time: 2023-09-02 18:22:23. Total running time: 1hr 42min 5s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00081_81_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-03-41/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194835.56it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 195226.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 284142.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 403557.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 820670.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1472190.05it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 177434.10it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 177156.31it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192423.35it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192174.39it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279589.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396463.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 806921.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1445774.89it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5490041.13it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3233812.25it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 36228652.67it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 123.99it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:24, 30.10it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:20, 34.79it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:18, 36.97it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:17, 38.01it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:16, 39.19it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:15, 39.58it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:15, 39.89it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:03<00:14, 40.11it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:14, 40.47it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:04<00:13, 40.67it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:05<00:12, 41.10it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:05<00:12, 41.28it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:06<00:11, 41.37it/s, v_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial run_with_tune_62480_00082 started with configuration:
+-----------------------------------------------------------------+
| Trial run_with_tune_62480_00082 config                          |
+-----------------------------------------------------------------+
| batch_size                                                  128 |
| class_key                                                     1 |
| img_key                                                       0 |
| lr                                                          0.1 |
| mlp_af_l0                                                  none |
| mlp_bn_l0                                                  True |
| mlp_config/block_list                      ... 'dropout': 0.0}] |
| mlp_do_l0                                                   0.3 |
| mlp_out_l0                                                  128 |
| regularization_ratio                                        0.5 |
| resnet_config/block_list                   ...adding':

[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00082_82_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-04-30/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194667.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194224.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 282472.55it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400809.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 811254.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1458236.88it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▎| 24739840/26421880 [00:02<00:00, 16588672.54it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10390171.91it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175119.65it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174800.67it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 195568.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 195110.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 283901.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 402825.69it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 818930.81it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1469055.76it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5575114.89it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3284356.86it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 21315179.66it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:35<00:00, 21.26it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:35<00:00, 21.26it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A
[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 44.18it/s]
[2m[36m(run_with_tune pid=1086)[0m                                                                            Training: 0it [00:00, ?it/s]Training:   0%|          | 0/375 [00:00<?, ?it/s]Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:35<00:00, 21.00it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:35<00:00, 20.99it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A
[2m[36m(run_with_tune pid=1086)[0m Epoch 0: 100%|██████████| 750/750 [00:35<00:00, 20.94it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                           [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

Epoch 0:   5%|▌         | 20/375 [00:01<00:18, 18.73it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:15, 21.75it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:13, 23.52it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:12, 23.77it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 24.40it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:10, 24.30it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:06<00:10, 23.25it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:07<00:09, 21.95it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:08<00:09, 21.00it/s, v_num=0]
Trial status: 82 TERMINATED | 1 RUNNING | 13 PENDING
Current time: 2023-09-02 18:23:23. Total running time: 1hr 43min 6s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.73it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:18, 18.28it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:18, 17.29it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:04<00:17, 16.99it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:06<00:16, 16.52it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:07<00:15, 16.78it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:13, 17.77it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.52it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 19.13it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:08, 19.85it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 20.25it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.62it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 21.09it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 21.45it/s, v_num=0]
Epoch 1:  80%|████████  | 300/375 [00:13<00:03, 21.7

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00083_83_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=True,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-05-54/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 189959.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:19, 189509.59it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 275755.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 391063.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 795618.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1426348.42it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 26421880/26421880 [00:02<00:00, 10148519.54it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171910.36it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171619.36it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194353.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193917.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282129.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 400090.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 744159.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██        | 917504/4422102 [00:01<00:02, 1413104.71it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 40284098.87it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.9 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.7 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 64.24it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.88it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 13.85it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:10, 12.16it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:07<00:09, 11.28it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:09<00:07, 11.04it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:10<00:05, 11.60it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:11<00:03, 12.08it/s, v_num=0]
Epoch 0:  85%|████████▌ | 160/188 [00:12<00:02, 12.42it/s, v_num=0]
Epoch 0:  96%|█████████▌| 180/188 [00:14<00:00, 12.66it/s, v_num=0]
Epoch 0: 100%|██████████| 188/188 [00:14<00:00, 12.84it/s, v_num=0]
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 83 TERMINATED | 1 RUNNING | 12 PENDING
Current time: 2023-09-02 18:24:23. Total running time: 1hr 44min 6s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00084_84_batch_size=64,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-07-05/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:13, 198338.63it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 197917.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 287813.47it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 408192.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 831009.08it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1488741.11it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▌| 25296896/26421880 [00:02<00:00, 17533836.93it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10592472.97it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175658.12it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175390.58it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193349.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193063.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281065.09it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 398480.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 810848.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1452974.84it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5514518.74it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3249948.85it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 33580524.09it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 27.95it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:28, 25.41it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:23, 30.29it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:20, 33.38it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:19, 34.89it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:18, 35.83it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:17, 36.59it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:16, 37.42it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:15, 38.01it/s, v_num=0]
Trial status: 84 TERMINATED | 1 RUNNING | 11 PENDING
Current time: 2023-09-02 18:24:53. Total running time: 1hr 44min 36s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:01<00:41, 17.72it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:33, 21.19it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:02<00:30, 22.82it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:03<00:27, 24.34it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:03<00:24, 26.38it/s, v_num=0]
Epoch 1:  16%|█▌        | 120/750 [00:04<00:22, 28.24it/s, v_num=0]
Epoch 1:  19%|█▊        | 140/750 [00:04<00:20, 29.23it/s, v_num=0]
Epoch 1:  21%|██▏       | 160/750 [00:05<00:19, 30.37it/s, v_num=0]
Epoch 1:  24%|██▍       | 180/750 [00:05<00:18, 31.18it/s, v_num=0]
Epoch 1:  27%|██▋       | 200/750 [00:06<00:17, 32.04it/s, v_num=0]
Epoch 1:  29%|██▉       | 220/750 [00:06<00:16, 32.83it/s, v_num=0]
Epoch 1:  32%|███▏      | 240/750 [00:07<00:15, 33.34it/s, v_num=0]
Epoch 1:  35%|███▍      | 260/750 [00:07<00:14, 33.83it/s, v_num=0]
Trial status: 84 TERMINATED | 1 RUNNING | 11 PENDING
Current time: 2023-09-02 18:25:23. Total running time: 1hr 45min 6s

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1: 100%|██████████| 750/750 [00:25<00:00, 29.26it/s, v_num=0]
Epoch 2:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 2:   3%|▎         | 20/750 [00:00<00:24, 29.93it/s, v_num=0]
Epoch 2:   5%|▌         | 40/750 [00:01<00:20, 34.66it/s, v_num=0]
Epoch 2:   8%|▊         | 60/750 [00:01<00:18, 37.31it/s, v_num=0]
Epoch 2:  11%|█         | 80/750 [00:02<00:17, 38.62it/s, v_num=0]
Epoch 2:  13%|█▎        | 100/750 [00:02<00:16, 39.66it/s, v_num=0]
Epoch 2:  16%|█▌        | 120/750 [00:02<00:15, 40.34it/s, v_num=0]
Epoch 2:  19%|█▊        | 140/750 [00:03<00:14, 41.15it/s, v_num=0]
Epoch 2:  21%|██▏       | 160/750 [00:03<00:14, 41.10it/s, v_num=0]
Epoch 2:  24%|██▍       | 180/750 [00:04<00:14, 39.43it/s, v_num=0]
Epoch 2:  27%|██▋       | 200/750 [00:05<00:14, 37.67it/s, v_num=0]
Epoch 2:  29%|██▉       | 220/750 [00:06<00:14, 36.65it/s, v_num=0]
Epoch 2:  32%|███▏      | 240/750 [00:06<00:14, 35.64it/s, v_num=0]
Epoch 2:  35%|███▍      | 260/750 [00:07<00:14, 34.80it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2: 100%|██████████| 750/750 [00:29<00:00, 25.44it/s, v_num=0]
Epoch 3:   0%|          | 0/750 [00:00<?, ?it/s, v_num=0]
Epoch 3:   3%|▎         | 20/750 [00:00<00:24, 29.61it/s, v_num=0]
Epoch 3:   5%|▌         | 40/750 [00:01<00:20, 35.47it/s, v_num=0]
Epoch 3:   8%|▊         | 60/750 [00:01<00:18, 37.35it/s, v_num=0]
Epoch 3:  11%|█         | 80/750 [00:02<00:17, 38.89it/s, v_num=0]
Epoch 3:  13%|█▎        | 100/750 [00:02<00:16, 39.98it/s, v_num=0]
Epoch 3:  16%|█▌        | 120/750 [00:02<00:15, 40.50it/s, v_num=0]
Epoch 3:  19%|█▊        | 140/750 [00:03<00:14, 41.27it/s, v_num=0]
Epoch 3:  21%|██▏       | 160/750 [00:03<00:14, 41.62it/s, v_num=0]
Epoch 3:  24%|██▍       | 180/750 [00:04<00:13, 41.92it/s, v_num=0]
Epoch 3:  27%|██▋       | 200/750 [00:04<00:13, 42.15it/s, v_num=0]
Epoch 3:  29%|██▉       | 220/750 [00:05<00:12, 42.38it/s, v_num=0]
Epoch 3:  32%|███▏      | 240/750 [00:05<00:11, 42.59it/s, v_num=0]
Epoch 3:  35%|███▍      | 260/750 [00:06<00:11, 42.52it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   3%|▎         | 20/750 [00:00<00:25, 28.55it/s, v_num=0]
Epoch 4:   5%|▌         | 40/750 [00:01<00:20, 35.08it/s, v_num=0]
Epoch 4:   8%|▊         | 60/750 [00:01<00:18, 36.96it/s, v_num=0]
Epoch 4:  11%|█         | 80/750 [00:02<00:17, 38.63it/s, v_num=0]
Epoch 4:  13%|█▎        | 100/750 [00:02<00:17, 36.57it/s, v_num=0]
Epoch 4:  16%|█▌        | 120/750 [00:03<00:18, 34.70it/s, v_num=0]
Epoch 4:  19%|█▊        | 140/750 [00:04<00:18, 33.62it/s, v_num=0]
Epoch 4:  21%|██▏       | 160/750 [00:04<00:18, 32.62it/s, v_num=0]
Epoch 4:  24%|██▍       | 180/750 [00:05<00:18, 31.67it/s, v_num=0]
Epoch 4:  27%|██▋       | 200/750 [00:06<00:17, 30.96it/s, v_num=0]
Epoch 4:  29%|██▉       | 220/750 [00:07<00:17, 30.34it/s, v_num=0]
Epoch 4:  29%|██▉       | 220/750 [00:07<00:17, 30.31it/s, v_num=0]
Epoch 4:  32%|███▏      | 240/750 [00:07<00:16, 30.02it/s, v_num=0]
Epoch 4:  35%|███▍      | 260/750 [00:08<00:16, 29.92it/s, v_num=0]
Epoch 4:  37%|███▋      | 280/750 [00:09<00:15, 29.9

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   3%|▎         | 20/750 [00:00<00:24, 29.38it/s, v_num=0]
Epoch 5:   5%|▌         | 40/750 [00:01<00:20, 34.74it/s, v_num=0]
Epoch 5:   8%|▊         | 60/750 [00:01<00:18, 37.21it/s, v_num=0]
Epoch 5:  11%|█         | 80/750 [00:02<00:17, 37.93it/s, v_num=0]
Epoch 5:  13%|█▎        | 100/750 [00:02<00:16, 39.48it/s, v_num=0]
Epoch 5:  16%|█▌        | 120/750 [00:03<00:15, 39.82it/s, v_num=0]
Epoch 5:  19%|█▊        | 140/750 [00:03<00:15, 40.02it/s, v_num=0]
Epoch 5:  21%|██▏       | 160/750 [00:03<00:14, 40.49it/s, v_num=0]
Epoch 5:  24%|██▍       | 180/750 [00:04<00:13, 40.78it/s, v_num=0]
Epoch 5:  27%|██▋       | 200/750 [00:04<00:13, 41.30it/s, v_num=0]
Epoch 5:  29%|██▉       | 220/750 [00:05<00:12, 41.41it/s, v_num=0]
Epoch 5:  32%|███▏      | 240/750 [00:05<00:12, 41.63it/s, v_num=0]
Epoch 5:  35%|███▍      | 260/750 [00:06<00:11, 41.50it/s, v_num=0]
Epoch 5:  37%|███▋      | 280/750 [00:06<00:11, 41.61it/s, v_num=0]
Epoch 5:  40%|████      | 300/750 [00:07<00:10, 41.7

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00085_85_batch_size=128,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-07-35/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:17, 191284.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 190813.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:34, 277722.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:06, 393780.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:39, 664075.85it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1345434.73it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 26421880/26421880 [00:02<00:00, 10174657.89it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 170693.17it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 170315.55it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 188792.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:23, 189215.57it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 275344.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396431.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 790931.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1438178.47it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 4422102/4422102 [00:01<00:00, 3183339.78it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37228063.78it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 27.78it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 22.02it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:14, 23.29it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.30it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:12, 24.07it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 24.40it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:10, 24.69it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 24.51it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 24.74it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:07, 24.56it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 23.71it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [00:09<00:06, 22.73it/s, v_num=0]
Epoch 0:  64%|██████▍   | 240/375 [00:10<00:06, 22.05it/s, v_num=0]
Epoch 0:  69%|██████▉   | 260/375 [00:12<00:05, 21.18it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:18, 19.69it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 22.67it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:13, 22.74it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:12, 23.34it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:12, 23.32it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:04<00:12, 21.72it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:05<00:12, 20.75it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:07<00:11, 19.68it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:08<00:11, 18.94it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:09<00:10, 18.42it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:10<00:09, 18.72it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:11<00:08, 19.19it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:12<00:06, 19.75it/s, v_num=0]
Epoch 1:  69%|██████▉   | 260/375 [00:12<00:05, 20.04it/s, v_num=0]
Epoch 1:  75%|███████▍  | 280/375 [00:13<00:04, 20.34

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:01<00:29, 11.97it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:02<00:24, 13.81it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:04<00:21, 14.33it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:05<00:19, 14.85it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:06<00:17, 15.34it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:07<00:15, 16.62it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:07<00:15, 16.62it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:07<00:13, 17.59it/s, v_num=0]
Trial status: 85 TERMINATED | 1 RUNNING | 10 PENDING
Current time: 2023-09-02 18:28:23. Total running time: 1hr 48min 6s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:01<00:17, 19.96it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:15, 21.94it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:02<00:13, 23.84it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:03<00:12, 24.05it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:04<00:11, 24.30it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:04<00:10, 24.92it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:05<00:09, 25.08it/s, v_num=0]
Epoch 3:  43%|████▎     | 160/375 [00:06<00:08, 25.37it/s, v_num=0]
Epoch 3:  48%|████▊     | 180/375 [00:07<00:07, 25.62it/s, v_num=0]
Epoch 3:  53%|█████▎    | 200/375 [00:07<00:06, 26.04it/s, v_num=0]
Epoch 3:  59%|█████▊    | 220/375 [00:08<00:05, 26.02it/s, v_num=0]
Epoch 3:  64%|██████▍   | 240/375 [00:09<00:05, 26.22it/s, v_num=0]
Epoch 3:  69%|██████▉   | 260/375 [00:09<00:04, 26.34it/s, v_num=0]
Epoch 3:  75%|███████▍  | 280/375 [00:11<00:03, 25.34it/s, v_num=0]
Epoch 3:  80%|████████  | 300/375 [00:12<00:03, 24.4

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 4:   5%|▌         | 20/375 [00:01<00:19, 18.54it/s, v_num=0]
Epoch 4:  11%|█         | 40/375 [00:01<00:15, 21.26it/s, v_num=0]
Epoch 4:  16%|█▌        | 60/375 [00:02<00:13, 23.03it/s, v_num=0]
Epoch 4:  21%|██▏       | 80/375 [00:03<00:12, 23.92it/s, v_num=0]
Epoch 4:  27%|██▋       | 100/375 [00:04<00:11, 24.35it/s, v_num=0]
Epoch 4:  32%|███▏      | 120/375 [00:04<00:10, 24.43it/s, v_num=0]
Epoch 4:  37%|███▋      | 140/375 [00:05<00:09, 25.00it/s, v_num=0]
Epoch 4:  43%|████▎     | 160/375 [00:06<00:08, 25.28it/s, v_num=0]
Epoch 4:  48%|████▊     | 180/375 [00:07<00:07, 24.98it/s, v_num=0]
Epoch 4:  53%|█████▎    | 200/375 [00:08<00:07, 23.61it/s, v_num=0]
Epoch 4:  59%|█████▊    | 220/375 [00:09<00:06, 22.20it/s, v_num=0]
Epoch 4:  64%|██████▍   | 240/375 [00:11<00:06, 21.36it/s, v_num=0]
Epoch 4:  69%|██████▉   | 260/375 [00:12<00:05, 20.85it/s, v_num=0]
Epoch 4:  75%|███████▍  | 280/375 [00:13<00:04, 20.41it/s, v_num=0]
Epoch 4:  80%|████████  | 300/375 [00:14<00:03, 20.8

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:00<00:17, 20.42it/s, v_num=0]
Trial status: 85 TERMINATED | 1 RUNNING | 10 PENDING
Current time: 2023-09-02 18:29:23. Total running time: 1hr 49min 6s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', '

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 6:   5%|▌         | 20/375 [00:01<00:27, 12.95it/s, v_num=0]
Epoch 6:  11%|█         | 40/375 [00:02<00:23, 14.29it/s, v_num=0]
Epoch 6:  16%|█▌        | 60/375 [00:04<00:21, 14.37it/s, v_num=0]
Epoch 6:  21%|██▏       | 80/375 [00:05<00:20, 14.69it/s, v_num=0]
Epoch 6:  27%|██▋       | 100/375 [00:06<00:16, 16.21it/s, v_num=0]
Epoch 6:  32%|███▏      | 120/375 [00:06<00:14, 17.28it/s, v_num=0]
Epoch 6:  37%|███▋      | 140/375 [00:07<00:12, 18.20it/s, v_num=0]
Epoch 6:  43%|████▎     | 160/375 [00:08<00:11, 18.86it/s, v_num=0]
Epoch 6:  48%|████▊     | 180/375 [00:09<00:09, 19.51it/s, v_num=0]
Epoch 6:  53%|█████▎    | 200/375 [00:10<00:08, 19.97it/s, v_num=0]
Trial status: 85 TERMINATED | 1 RUNNING | 10 PENDING
Current time: 2023-09-02 18:29:54. Total running time: 1hr 49min 36s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00086_86_batch_size=256,lr=0.0100,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-08-09/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193309.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 192940.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 280837.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400689.52it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:32, 809057.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1457926.79it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 170106.56it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 169732.00it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 196652.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 196223.84it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 285511.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 404972.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 823570.30it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1477094.98it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5606465.65it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3302374.92it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 31521572.25it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 30.61it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 1: 100%|██████████| 375/375 [08:49<00:00,  1.41s/it, v_num=0]
Epoch 0:  11%|█         | 20/188 [00:02<00:23,  7.08it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:04<00:18,  8.06it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:07<00:15,  8.28it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:08<00:11,  9.20it/s, v_num=0]
Trial status: 86 TERMINATED | 1 RUNNING | 9 PENDING
Current time: 2023-09-02 18:30:24. Total running time: 1hr 50min 6s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channe

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1: 100%|██████████| 188/188 [08:23<00:00,  2.68s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 1: 100%|██████████| 375/375 [07:01<00:00,  1.12s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Epoch 1: 100%|██████████| 188/188 [06:23<00:00,  2.04s/it, v_num=0]
Trial status: 86 TERMINATED | 1 RUNNING | 9 PENDING
Current time: 2023-09-02 18:30:54. Total running time: 1hr 50min 37s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'rel

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00087_87_batch_size=64,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-08-58/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:12, 198421.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:13, 198040.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 288243.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 408807.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 831295.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:00<00:17, 1490888.81it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  96%|█████████▌| 25264128/26421880 [00:02<00:00, 17214766.47it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10599921.70it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176519.24it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176259.87it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194410.31it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194085.87it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 282678.53it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 401358.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 816664.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1462908.36it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5551445.29it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3270147.13it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37486592.00it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 96.86it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:23, 31.54it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:19, 36.27it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:19, 35.62it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:20, 32.58it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:03<00:21, 30.72it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:04<00:21, 29.34it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:04<00:21, 28.30it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:05<00:21, 27.49it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:06<00:21, 27.00it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:07<00:20, 26.91it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [00:08<00:19, 26.71it/s, v_num=0]
Epoch 0:  32%|███▏      | 240/750 [00:09<00:19, 26.62it/s, v_num=0]
Epoch 0:  35%|███▍      | 260/750 [00:09<00:18, 26.44it/s, v_n

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00088_88_batch_size=128,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-09-44/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195400.65it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194996.70it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283813.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:20, 325697.68it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:37, 699607.73it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 851968/26421880 [00:01<00:19, 1322647.01it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173589.57it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 173216.49it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 197833.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 197268.62it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 287124.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 406618.92it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 827909.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1484661.33it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35808087.88it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 42.01it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.22it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:14, 23.03it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:13, 23.83it/s, v_num=0]
Trial status: 88 TERMINATED | 1 RUNNING | 7 PENDING
Current time: 2023-09-02 18:32:24. Total running time: 1hr 52min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:00<00:17, 20.23it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:14, 22.56it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:13, 23.54it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:12, 24.58it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:04<00:11, 24.87it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:04<00:10, 25.09it/s, v_num=0]
Epoch 1:  37%|███▋      | 140/375 [00:05<00:09, 25.12it/s, v_num=0]
Epoch 1:  43%|████▎     | 160/375 [00:06<00:09, 23.56it/s, v_num=0]
Epoch 1:  48%|████▊     | 180/375 [00:08<00:08, 22.47it/s, v_num=0]
Epoch 1:  53%|█████▎    | 200/375 [00:09<00:08, 21.57it/s, v_num=0]
Epoch 1:  59%|█████▊    | 220/375 [00:10<00:07, 20.70it/s, v_num=0]
Epoch 1:  64%|██████▍   | 240/375 [00:11<00:06, 20.28it/s, v_num=0]
Trial status: 88 TERMINATED | 1 RUNNING | 7 PENDING
Current time: 2023-09-02 18:32:54. Total running time: 1hr 52min 37s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00089_89_batch_size=256,lr=0.1000,mlp_af_l0=relu,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-12-31/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:13, 197001.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:14, 196616.16it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:31, 286176.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:04, 405821.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 825441.90it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1479910.29it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▍| 25067520/26421880 [00:02<00:00, 17213578.48it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10514216.40it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 173180.87it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172775.78it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192134.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191705.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 278690.65it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 396051.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 805653.97it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1443931.80it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 40663421.83it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 118.31it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:01<00:12, 13.23it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:02<00:10, 14.00it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 14.10it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 14.52it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:06<00:06, 14.35it/s, v_num=0]
Epoch 0:  64%|██████▍   | 120/188 [00:08<00:04, 13.70it/s, v_num=0]
Epoch 0:  74%|███████▍  | 140/188 [00:10<00:03, 12.75it/s, v_num=0]
Trial status: 89 TERMINATED | 1 RUNNING | 6 PENDING
Current time: 2023-09-02 18:33:24. Total running time: 1hr 53min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, '

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.56it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:11, 13.43it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:09, 13.97it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 13.71it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:07<00:07, 12.57it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:10<00:05, 11.77it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:12<00:04, 11.40it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:13<00:02, 11.68it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.09it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:15<00:00, 12.22it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00090_90_batch_size=64,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-15-08/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194632.49it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194209.27it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 282757.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400926.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 676275.23it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26421880 [00:01<00:18, 1369732.55it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  94%|█████████▍| 24805376/26421880 [00:02<00:00, 17141231.78it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10397522.13it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 174971.14it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 174570.93it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 192265.61it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 191873.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 279186.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 395878.01it/s][A[A


Trial status: 90 TERMINATED | 1 RUNNING | 5 PENDING
Current time: 2023-09-02 18:33:54. Total running time: 1hr 53min 37s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 804797.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1443687.26it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 44%|████▎     | 1933312/4422102 [00:01<00:00, 2843439.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
100%|██████████| 4422102/4422102 [00:01<00:00, 3225843.16it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 25343048.11it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 40.36it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Epoch 0:   3%|▎         | 20/750 [00:00<00:32, 22.62it/s, v_num=0]
Epoch 0:   5%|▌         | 40/750 [00:01<00:24, 29.37it/s, v_num=0]
Epoch 0:   8%|▊         | 60/750 [00:01<00:21, 31.89it/s, v_num=0]
Epoch 0:  11%|█         | 80/750 [00:02<00:19, 33.90it/s, v_num=0]
Epoch 0:  13%|█▎        | 100/750 [00:02<00:18, 35.61it/s, v_num=0]
Epoch 0:  16%|█▌        | 120/750 [00:03<00:17, 36.42it/s, v_num=0]
Epoch 0:  19%|█▊        | 140/750 [00:03<00:16, 37.36it/s, v_num=0]
Epoch 0:  21%|██▏       | 160/750 [00:04<00:15, 38.03it/s, v_num=0]
Epoch 0:  24%|██▍       | 180/750 [00:04<00:14, 38.69it/s, v_num=0]
Epoch 0:  27%|██▋       | 200/750 [00:05<00:14, 38.76it/s, v_num=0]
Epoch 0:  29%|██▉       | 220/750 [0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   3%|▎         | 20/750 [00:00<00:24, 29.66it/s, v_num=0]
Epoch 1:   5%|▌         | 40/750 [00:01<00:20, 34.50it/s, v_num=0]
Epoch 1:   8%|▊         | 60/750 [00:01<00:19, 35.31it/s, v_num=0]
Epoch 1:  11%|█         | 80/750 [00:02<00:20, 32.88it/s, v_num=0]
Epoch 1:  13%|█▎        | 100/750 [00:03<00:20, 31.56it/s, v_num=0]
Trial status: 90 TERMINATED | 1 RUNNING | 5 PENDING
Current time: 2023-09-02 18:34:24. Total running time: 1hr 54min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00091_91_batch_size=128,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-17-11/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 194279.78it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193784.77it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281999.37it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 400000.36it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 813292.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1458410.82it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 172813.40it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 172424.20it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 194807.95it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 194339.02it/s][A[A


Trial status: 91 TERMINATED | 1 RUNNING | 4 PENDING
Current time: 2023-09-02 18:34:54. Total running time: 1hr 54min 37s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+------------------------------

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   3%|▎         | 131072/4422102 [00:00<00:15, 282151.45it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 400783.99it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 10%|█         | 458752/4422102 [00:00<00:05, 746753.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 20%|██        | 884736/4422102 [00:01<00:02, 1351986.76it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 41%|████      | 1802240/4422102 [00:01<00:00, 2686531.75it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  81%|████████  | 3571712/4422102 [00:01<00:00, 5169644.00it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3269390.28it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 17042049.72it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 29.81it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:01<00:31, 11.38it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:03<00:26, 12.83it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:04<00:23, 13.62it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:05<00:21, 13.97it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:07<00:19, 14.28it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:08<00:17, 14.80it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:08<00:14, 15.89it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:09<00:12, 16.68it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:10<00:11, 17.19it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:11<00:09, 17.82it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:28, 12.66it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:02<00:19, 16.92it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:03<00:16, 19.24it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:14, 20.44it/s, v_num=0]
Trial status: 91 TERMINATED | 1 RUNNING | 4 PENDING
Current time: 2023-09-02 18:35:24. Total running time: 1hr 55min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:   5%|▌         | 20/375 [00:00<00:17, 20.72it/s, v_num=0]
Epoch 2:  11%|█         | 40/375 [00:01<00:14, 23.38it/s, v_num=0]
Epoch 2:  16%|█▌        | 60/375 [00:02<00:12, 24.31it/s, v_num=0]
Epoch 2:  21%|██▏       | 80/375 [00:03<00:11, 24.71it/s, v_num=0]
Epoch 2:  27%|██▋       | 100/375 [00:03<00:10, 25.25it/s, v_num=0]
Epoch 2:  32%|███▏      | 120/375 [00:04<00:10, 25.32it/s, v_num=0]
Epoch 2:  37%|███▋      | 140/375 [00:05<00:09, 25.53it/s, v_num=0]
Epoch 2:  43%|████▎     | 160/375 [00:06<00:08, 25.31it/s, v_num=0]
Epoch 2:  48%|████▊     | 180/375 [00:07<00:07, 25.40it/s, v_num=0]
Epoch 2:  53%|█████▎    | 200/375 [00:08<00:07, 24.50it/s, v_num=0]
Epoch 2:  59%|█████▊    | 220/375 [00:09<00:06, 23.33it/s, v_num=0]
Epoch 2:  64%|██████▍   | 240/375 [00:10<00:06, 22.42it/s, v_num=0]
Epoch 2:  69%|██████▉   | 260/375 [00:11<00:05, 21.82it/s, v_num=0]
Epoch 2:  75%|███████▍  | 280/375 [00:13<00:04, 21.17it/s, v_num=0]
Trial status: 91 TERMINATED | 1 RUNNING | 4 PENDING


[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 3:   5%|▌         | 20/375 [00:01<00:17, 19.94it/s, v_num=0]
Epoch 3:  11%|█         | 40/375 [00:01<00:15, 21.02it/s, v_num=0]
Epoch 3:  16%|█▌        | 60/375 [00:02<00:14, 22.31it/s, v_num=0]
Epoch 3:  21%|██▏       | 80/375 [00:03<00:12, 22.82it/s, v_num=0]
Epoch 3:  27%|██▋       | 100/375 [00:04<00:13, 21.11it/s, v_num=0]
Epoch 3:  32%|███▏      | 120/375 [00:05<00:12, 20.05it/s, v_num=0]
Epoch 3:  37%|███▋      | 140/375 [00:07<00:12, 19.29it/s, v_num=0]
Epoch 3:  43%|████▎     | 160/375 [00:08<00:11, 18.87it/s, v_num=0]
Epoch 3:  48%|████▊     | 180/375 [00:09<00:10, 18.30it/s, v_num=0]
Epoch 3:  53%|█████▎    | 200/375 [00:10<00:09, 18.36it/s, v_num=0]
Epoch 3:  59%|█████▊    | 220/375 [00:11<00:08, 18.88it/s, v_num=0]
Epoch 3:  64%|██████▍   | 240/375 [00:12<00:06, 19.32it/s, v_num=0]
Epoch 3:  69%|██████▉   | 260/375 [00:13<00:05, 19.63it/s, v_num=0]
Epoch 3:  75%|███████▍  | 280/375 [00:14<00:04, 19.96it/s, v_num=0]
Epoch 3:  80%|████████  | 300/375 [00:14<00:03, 20.2

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Trial status: 91 TERMINATED | 1 RUNNING | 4 PENDING
Current time: 2023-09-02 18:36:24. Total running time: 1hr 56min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logsoftmax', 'batch_norm': False, 'dropout': 0.0}]}, 'img_key': 0, 'class_key': 1, 'mlp_out_l0': 64, 'mlp_af_l0': 'relu', 'mlp_bn_l0': True, 'mlp_do_l0': 0.1}
+-------------------------------

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 5:   5%|▌         | 20/375 [00:01<00:18, 19.55it/s, v_num=0]
Epoch 5:  11%|█         | 40/375 [00:01<00:14, 22.66it/s, v_num=0]
Epoch 5:  16%|█▌        | 60/375 [00:02<00:12, 24.36it/s, v_num=0]
Epoch 5:  21%|██▏       | 80/375 [00:03<00:12, 24.53it/s, v_num=0]
Epoch 5:  27%|██▋       | 100/375 [00:04<00:11, 24.85it/s, v_num=0]
Epoch 5:  32%|███▏      | 120/375 [00:04<00:10, 25.17it/s, v_num=0]
Epoch 5:  37%|███▋      | 140/375 [00:05<00:09, 25.31it/s, v_num=0]
Epoch 5:  43%|████▎     | 160/375 [00:06<00:08, 25.25it/s, v_num=0]
Epoch 5:  48%|████▊     | 180/375 [00:07<00:07, 25.35it/s, v_num=0]
Trial status: 91 TERMINATED | 1 RUNNING | 4 PENDING
Current time: 2023-09-02 18:36:54. Total running time: 1hr 56min 37s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size'

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00092_92_batch_size=256,lr=0.0100,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-17-45/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:15, 195068.96it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:15, 194619.19it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:32, 283014.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 401681.71it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 817732.06it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1464428.13it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  95%|█████████▌| 25231360/26421880 [00:02<00:00, 17099046.92it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10424768.40it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 175880.48it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 175536.32it/s]


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:23, 190480.02it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 189964.93it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 276368.60it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 391863.34it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 797905.98it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 34492455.26it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 41.73it/s]
Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 0:  11%|█         | 20/188 [00:02<00:17,  9.71it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:03<00:12, 12.12it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 12.94it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:06<00:08, 13.25it/s, v_num=0]
Epoch 0:  53%|█████▎    | 100/188 [00:07<00:06, 13.52it/s, v_num=0]
Trial status: 92 TERMINATED | 1 RUNNING | 3 PENDING
Current time: 2023-09-02 18:37:24. Total running time: 1hr 57min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.73it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 14.14it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:08, 14.57it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:05<00:07, 14.75it/s, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:06<00:05, 14.75it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:08<00:04, 14.74it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:10<00:03, 13.95it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:12<00:02, 13.07it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:14<00:00, 12.43it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:15<00:00, 12.25it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 2:  11%|█         | 20/188 [00:02<00:22,  7.55it/s, v_num=0]
Epoch 2:  21%|██▏       | 40/188 [00:05<00:18,  7.94it/s, v_num=0]
Epoch 2:  32%|███▏      | 60/188 [00:06<00:14,  8.65it/s, v_num=0]
Epoch 2:  43%|████▎     | 80/188 [00:09<00:12,  8.71it/s, v_num=0]
Epoch 2:  53%|█████▎    | 100/188 [00:11<00:10,  8.66it/s, v_num=0]
Epoch 2:  64%|██████▍   | 120/188 [00:13<00:07,  8.74it/s, v_num=0]
Epoch 2:  74%|███████▍  | 140/188 [00:14<00:05,  9.35it/s, v_num=0]
Epoch 2:  85%|████████▌ | 160/188 [00:16<00:02,  9.77it/s, v_num=0]
Epoch 2:  96%|█████████▌| 180/188 [00:17<00:00, 10.08it/s, v_num=0]
Epoch 2: 100%|██████████| 188/188 [00:18<00:00, 10.30it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation DataLoader 0:  43%|████▎     | 20/47 [00:

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00093_93_batch_size=64,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-18-35/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193669.83it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193247.10it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281239.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398818.29it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 458752/26421880 [00:00<00:34, 742194.11it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 884736/26

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  93%|█████████▎| 24576000/26421880 [00:02<00:00, 16619908.71it/s][A[A100%|██████████| 26421880/26421880 [00:02<00:00, 10306160.05it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171542.31it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 171155.02it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193310.80it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 192858.12it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 280539.18it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 397890.22it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 809718.03it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:01<00:02, 1450975.54it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5508139.90it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3245265.53it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37617207.30it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 77.79it/s]
Epoch 0:   0%|          | 0/750 [00:00<?, ?it/s] 
Trial status: 93 TERMINATED | 1 RUNNING | 2 PENDING
Current time: 2023-09-02 18:38:25. Total running time: 1hr 58min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun':

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.
[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00094_94_batch_size=128,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-19-19/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:18, 190477.38it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:18, 189868.91it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:35, 276501.17it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 196608/26421880 [00:00<01:22, 317111.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 425984/26421880 [00:00<00:38, 681604.33it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 819200/26

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 171233.38it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 170846.29it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz
Trial status: 94 TERMINATED | 1 RUNNING | 1 PENDING
Current time: 2023-09-02 18:38:55. Total running time: 1hr 58min 37s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out_size': 64, 'activation_fun': 'relu', 'batch_norm': True, 'dropout': 0.1}, {'in_size': 64, 'out_size': 10, 'activation_fun': 'logs

[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 197886.86it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 197458.40it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:14, 287257.41it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 407501.94it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 829112.42it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 [00:00<00:02, 1486127.30it/s][A[A
[2

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 35455298.84it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]
Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 34.82it/s]
Epoch 0:   0%|          | 0/375 [00:00<?, ?it/s] 
Epoch 0:   5%|▌         | 20/375 [00:00<00:16, 21.09it/s, v_num=0]
Epoch 0:  11%|█         | 40/375 [00:01<00:13, 24.38it/s, v_num=0]
Epoch 0:  16%|█▌        | 60/375 [00:02<00:12, 24.62it/s, v_num=0]
Epoch 0:  21%|██▏       | 80/375 [00:03<00:12, 24.53it/s, v_num=0]
Epoch 0:  27%|██▋       | 100/375 [00:04<00:11, 24.97it/s, v_num=0]
Epoch 0:  32%|███▏      | 120/375 [00:04<00:10, 25.15it/s, v_num=0]
Epoch 0:  37%|███▋      | 140/375 [00:05<00:09, 25.13it/s, v_num=0]
Epoch 0:  43%|████▎     | 160/375 [00:06<00:08, 25.27it/s, v_num=0]
Epoch 0:  48%|████▊     | 180/375 [00:07<00:07, 24.86it/s, v_num=0]
Epoch 0:  53%|█████▎    | 200/375 [00:08<00:07, 22.96it/s, v_num=0]
Epoch 0:  59%|█████▊    | 220/375 [0

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:   5%|▌         | 20/375 [00:01<00:18, 19.11it/s, v_num=0]
Epoch 1:  11%|█         | 40/375 [00:01<00:15, 22.10it/s, v_num=0]
Epoch 1:  16%|█▌        | 60/375 [00:02<00:13, 23.23it/s, v_num=0]
Epoch 1:  21%|██▏       | 80/375 [00:03<00:12, 24.25it/s, v_num=0]
Epoch 1:  27%|██▋       | 100/375 [00:04<00:12, 21.93it/s, v_num=0]
Epoch 1:  32%|███▏      | 120/375 [00:05<00:12, 20.84it/s, v_num=0]
Trial status: 94 TERMINATED | 1 RUNNING | 1 PENDING
Current time: 2023-09-02 18:39:25. Total running time: 1hr 59min 7s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, '

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m GPU available: True (cuda), used: True
[2m[36m(run_with_tune pid=1086)[0m TPU available: False, using: 0 TPU cores
[2m[36m(run_with_tune pid=1086)[0m IPU available: False, using: 0 IPUs
[2m[36m(run_with_tune pid=1086)[0m HPU available: False, using: 0 HPUs
[2m[36m(run_with_tune pid=1086)[0m Missing logger folder: /root/ray_results/tune_mnist_asha/run_with_tune_62480_00095_95_batch_size=256,lr=0.1000,mlp_af_l0=none,mlp_bn_l0=False,mlp_do_l0=0.3000,mlp_out_l0=128_2023-09-02_18-19-56/lightning_logs


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz to data/FashionMNIST/raw/train-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 0/26421880 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 32768/26421880 [00:00<02:16, 193602.44it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 65536/26421880 [00:00<02:16, 193188.48it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  0%|          | 131072/26421880 [00:00<01:33, 281088.51it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 229376/26421880 [00:00<01:05, 398555.43it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  2%|▏         | 491520/26421880 [00:00<00:31, 810836.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  4%|▎         | 950272/26421880 [00:01<00:17, 1454313.68it/s][A

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw/train-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/29515 [00:00<?, ?it/s][A[A


[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/train-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 100%|██████████| 29515/29515 [00:00<00:00, 176823.06it/s][A[A100%|██████████| 29515/29515 [00:00<00:00, 176522.51it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/4422102 [00:00<?, ?it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|          | 32768/4422102 [00:00<00:22, 193347.24it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  1%|▏         | 65536/4422102 [00:00<00:22, 193477.25it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  3%|▎         | 131072/4422102 [00:00<00:15, 281686.74it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
  5%|▌         | 229376/4422102 [00:00<00:10, 399600.14it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 11%|█         | 491520/4422102 [00:00<00:04, 812929.79it/s][A[A
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
 21%|██▏       | 950272/4422102 

[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-images-idx3-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m  87%|████████▋ | 3833856/4422102 [00:01<00:00, 5524759.03it/s][A[A100%|██████████| 4422102/4422102 [00:01<00:00, 3256340.51it/s]


[2m[36m(run_with_tune pid=1086)[0m Downloading http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz
[2m[36m(run_with_tune pid=1086)[0m Extracting data/FashionMNIST/raw/t10k-labels-idx1-ubyte.gz to data/FashionMNIST/raw
[2m[36m(run_with_tune pid=1086)[0m 
Sanity Checking: 0it [00:00, ?it/s]


[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   0%|          | 0/5148 [00:00<?, ?it/s][A[A100%|██████████| 5148/5148 [00:00<00:00, 37036495.70it/s]
[2m[36m(run_with_tune pid=1086)[0m LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m   | Name     | Type               | Params
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 0 | accuracy | MulticlassAccuracy | 0     
[2m[36m(run_with_tune pid=1086)[0m 1 | mlp      | MLP                | 10.6 K
[2m[36m(run_with_tune pid=1086)[0m 2 | resnet   | ResNet             | 9.8 K 
[2m[36m(run_with_tune pid=1086)[0m ------------------------------------------------
[2m[36m(run_with_tune pid=1086)[0m 20.4 K    Trainable params
[2m[36m(run_with_tune pid=1086)[0m 0         Non-trainable params
[2m[36m(run_with_tune pid

[2m[36m(run_with_tune pid=1086)[0m Epoch 1: 100%|██████████| 375/375 [00:29<00:00, 12.80it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                         [AEpoch 1: 100%|██████████| 375/375 [00:29<00:00, 12.79it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                         [A
[2m[36m(run_with_tune pid=1086)[0m Sanity Checking:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0:   0%|          | 0/2 [00:00<?, ?it/s]Sanity Checking DataLoader 0: 100%|██████████| 2/2 [00:00<00:00, 67.20it/s]


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m     assert self._parent_pid == os.getpid(), 'can only test a child process'
[2m[36m(run_with_tune pid=1086)[0m AssertionError: can only test a child process
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <funct

Epoch 0:   0%|          | 0/188 [00:00<?, ?it/s] 
Epoch 1: 100%|██████████| 375/375 [00:29<00:00, 12.60it/s, v_num=0]
Epoch 1: 100%|██████████| 375/375 [00:29<00:00, 12.60it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A
                                                                        [A


[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1478, in __del__
[2m[36m(run_with_tune pid=1086)[0m     self._shutdown_workers()
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/python3.10/dist-packages/torch/utils/data/dataloader.py", line 1461, in _shutdown_workers
[2m[36m(run_with_tune pid=1086)[0m     if w.is_alive():
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/lib/python3.10/multiprocessing/process.py", line 160, in is_alive
[2m[36m(run_with_tune pid=1086)[0m Exception ignored in: <function _MultiProcessingDataLoaderIter.__del__ at 0x7acc463f4820>
[2m[36m(run_with_tune pid=1086)[0m Traceback (most recent call last):
[2m[36m(run_with_tune pid=1086)[0m   File "/usr/local/lib/py

[2m[36m(run_with_tune pid=1086)[0m Epoch 1: 100%|██████████| 375/375 [00:29<00:00, 12.52it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
                                                                        [A
Epoch 0:  11%|█         | 20/188 [00:01<00:13, 12.10it/s, v_num=0]
Epoch 0:  21%|██▏       | 40/188 [00:03<00:11, 13.07it/s, v_num=0]
Epoch 0:  32%|███▏      | 60/188 [00:04<00:09, 13.75it/s, v_num=0]
Epoch 0:  43%|████▎     | 80/188 [00:05<00:07, 13.75it/s, v_num=0]
Trial status: 95 TERMINATED | 1 RUNNING
Current time: 2023-09-02 18:39:55. Total running time: 1hr 59min 38s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


Epoch 1:  11%|█         | 20/188 [00:01<00:13, 12.35it/s, v_num=0]
Epoch 1:  21%|██▏       | 40/188 [00:02<00:10, 13.73it/s, v_num=0]
Epoch 1:  32%|███▏      | 60/188 [00:04<00:09, 14.00it/s, v_num=0]
Epoch 1:  43%|████▎     | 80/188 [00:06<00:08, 12.47it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [09:00<00:00,  2.87s/it, v_num=0]
Epoch 1:  53%|█████▎    | 100/188 [00:09<00:08, 10.63it/s, v_num=0]
Epoch 1:  64%|██████▍   | 120/188 [00:11<00:06, 10.26it/s, v_num=0]
Epoch 1:  74%|███████▍  | 140/188 [00:12<00:04, 10.77it/s, v_num=0]
Epoch 1:  85%|████████▌ | 160/188 [00:14<00:02, 11.12it/s, v_num=0]
Epoch 1:  96%|█████████▌| 180/188 [00:15<00:00, 11.51it/s, v_num=0]
Epoch 1: 100%|██████████| 188/188 [00:16<00:00, 11.70it/s, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
Validation: 0it [00:00, ?it/s][A
[2m[36m(run_with_tune pid=1086)[0m 
Validation:   0%|          | 0/47 [00:00<?, ?it/s][A
Validation DataLoader 0:   0%|          | 0/47 [00:00<?, ?it/s][A
[2m[36m(run_with_tune

[2m[36m(run_with_tune pid=1086)[0m Metric time_total_s does not exist in `trainer.callback_metrics.


[2m[36m(run_with_tune pid=1086)[0m Epoch 1: 100%|██████████| 375/375 [08:03<00:00,  1.29s/it, v_num=0]
[2m[36m(run_with_tune pid=1086)[0m 
[2m[36m(run_with_tune pid=1086)[0m                                                                         [AEpoch 1: 100%|██████████| 188/188 [07:16<00:00,  2.32s/it, v_num=0]
Trial status: 95 TERMINATED | 1 RUNNING
Current time: 2023-09-02 18:40:55. Total running time: 2hr 0min 38s
Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
Current best trial: 62480_00000 with ptl/val_loss=0.4649209976196289 and params={'regularization_ratio': 0.5, 'batch_size': 64, 'lr': 0.01, 'resnet_config': {'first_conv': {'in_channels': 1, 'out_channels': 32, 'kernel_size': 3, 'stride': 2, 'padding': 1}, 'block_list': [{'in_channels': 32, 'out_channels': 16, 'kernel_size': 3, 'stride': 2, 'padding': 1}, {'in_channels': 16, 'out_channels': 8, 'kernel_size': 3, 'stride': 1, 'padding': 'same'}], 'pool_size': 2}, 'mlp_config': {'block_list': [{'in_size': 72, 'out

In [None]:
# Last Tune status report of the sweep, kept here for reference:
#   Trial status: 96 TERMINATED
#   Current time: 2023-09-02 18:41:36. Total running time: 2hr 1min 18s
#   Logical resource usage: 2.0/2 CPUs, 1.0/1 GPUs
#
# Narrow the per-trial results table down to the iteration count, the selected
# config columns and the validation metrics, then display the 20 trials with
# the lowest validation loss.
# NOTE(review): `results` is presumably produced by the tuning run in an
# earlier cell -- confirm before running this cell on a fresh kernel.
df = results.get_dataframe()[
    [
        'training_iteration',
        'config/batch_size',
        'config/lr',
        'config/mlp_af_l0',
        'config/mlp_bn_l0',
        'config/mlp_do_l0',
        'config/mlp_out_l0',
        'ptl/val_loss',
        'ptl/val_accuracy',
    ]
]
# Ascending order is the default, so the best (smallest-loss) trials come first.
df.sort_values(by='ptl/val_loss').head(20)

Unnamed: 0,training_iteration,config/batch_size,config/lr,config/mlp_af_l0,config/mlp_bn_l0,config/mlp_do_l0,config/mlp_out_l0,ptl/val_loss,ptl/val_accuracy
0,6,64,0.01,relu,True,0.1,64,0.464921,0.825733
49,7,128,0.01,relu,True,0.1,128,0.465987,0.826847
73,7,128,0.01,relu,True,0.3,128,0.471249,0.822388
26,8,256,0.01,relu,True,0.3,64,0.476863,0.819004
61,7,128,0.01,relu,False,0.1,128,0.478739,0.820178
60,6,64,0.01,relu,False,0.1,128,0.479928,0.820506
85,7,128,0.01,relu,False,0.3,128,0.491108,0.815976
12,5,64,0.01,relu,False,0.1,64,0.497068,0.813628
37,7,128,0.01,relu,False,0.3,64,0.500579,0.813494
84,6,64,0.01,relu,False,0.3,128,0.501533,0.813122
