In [1]:
import os
import json

import numpy as np
import torch
import torchvision
from torchsummary import summary

from project_18408.datasets import *
from project_18408.evaluation import *
from project_18408.experiments import *
from project_18408.utils import *

In [2]:
# Record the library versions alongside the results for reproducibility.
print("PyTorch Version:", torch.__version__)
print("Torchvision Version:", torchvision.__version__)
# Prefer CUDA when it is available; otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
# Report which backend was picked, based on the device that was just built.
print("Using the GPU!" if device.type == "cuda"
      else "WARNING: Could not find GPU! Using CPU only")

PyTorch Version: 1.8.0
Torchvision Version: 0.9.0
Using the GPU!


In [3]:
# JSON file containing the list of experiment configurations; it is opened
# and parsed with json.load in the following cell.
configs_fname = "experiment_configs_mnist_test2.json"

In [4]:
# Read the raw configuration dicts. The encoding is given explicitly because
# JSON is UTF-8 while open() otherwise uses the platform default encoding
# (which is not UTF-8 on many Windows setups).
with open(configs_fname, 'r', encoding='utf-8') as f:
    raw_configs = json.load(f)
# Keep the parsed dicts and the ExperimentConfig objects under separate names
# so `configs` only ever refers to one kind of object.
configs = [ExperimentConfig.from_dict(raw) for raw in raw_configs]

In [5]:
# Sanity check: show the first parsed configuration.
print(configs[0])

{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_index': 0}


In [6]:
# Directories passed to ExperimentManager in the next cell.
# NOTE(review): get_rel_pkg_path presumably resolves these relative to the
# project/package root — confirm against its definition in project_18408.
data_dir = get_rel_pkg_path("dataset/")
experiment_dir = get_rel_pkg_path("experiments/")

In [7]:
# Shared manager instance; process_training() below uses it as a global to
# register and run every configuration.
manager = ExperimentManager(data_dir, experiment_dir)

In [8]:
def process_training(config):
    """Register ``config`` with the shared manager and run its training.

    Relies on the notebook-level ``manager`` and ``device`` globals.

    Args:
        config: Experiment configuration to run (an element of ``configs``).

    Returns:
        The ``(setup, state)`` pair produced by ``manager.run_training``.
        Previously these were bound to locals and discarded; returning them
        lets callers inspect the outcome, and callers that ignore the return
        value are unaffected.
    """
    # NOTE(review): exist_ok / completed_ok presumably let this cell be re-run
    # for experiments that were already added or already finished — confirm
    # against ExperimentManager.
    manager.add_experiment(config, exist_ok=True)
    setup, state = manager.run_training(config,
                                        device,
                                        num_workers=2,
                                        pin_memory=False,
                                        completed_ok=True)
    return setup, state

In [None]:
# Train every configuration in file order, printing a separator line and the
# configuration itself before each run so the log sections are easy to find.
for c in configs:
    print("=" * 40, c, sep="\n")
    process_training(c)

{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_index': 0}


  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

----------
Epoch 1/50
----------
Training


Avg. Loss: 0.5855, Total Loss: 0.3837, Loss Parts: [0.3837]: 100%|███████████████████| 469/469 [00:05<00:00, 79.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.5855
Training Accuracy: 0.8517
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3788
Testing accuracy: 0.8995
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.3730, Total Loss: 0.2483, Loss Parts: [0.2483]: 100%|███████████████████| 469/469 [00:05<00:00, 86.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3730
Training Accuracy: 0.8976
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3347
Testing accuracy: 0.9079
Best testing accuracy was: 0.8995
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.3420, Total Loss: 0.3483, Loss Parts: [0.3483]: 100%|███████████████████| 469/469 [00:05<00:00, 80.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3420
Training Accuracy: 0.9046
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3155
Testing accuracy: 0.9122
Best testing accuracy was: 0.9079
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.3257, Total Loss: 0.2240, Loss Parts: [0.2240]: 100%|███████████████████| 469/469 [00:05<00:00, 78.99it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3257
Training Accuracy: 0.9095
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3055
Testing accuracy: 0.9166
Best testing accuracy was: 0.9122
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.3153, Total Loss: 0.4058, Loss Parts: [0.4058]: 100%|███████████████████| 469/469 [00:05<00:00, 79.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3153
Training Accuracy: 0.9121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2990
Testing accuracy: 0.9173
Best testing accuracy was: 0.9166
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.3077, Total Loss: 0.3488, Loss Parts: [0.3488]: 100%|███████████████████| 469/469 [00:05<00:00, 79.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3077
Training Accuracy: 0.9143
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.19it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2929
Testing accuracy: 0.9193
Best testing accuracy was: 0.9173
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.3020, Total Loss: 0.2624, Loss Parts: [0.2624]: 100%|███████████████████| 469/469 [00:05<00:00, 80.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3020
Training Accuracy: 0.9160
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2896
Testing accuracy: 0.9207
Best testing accuracy was: 0.9193
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.2974, Total Loss: 0.4364, Loss Parts: [0.4364]: 100%|███████████████████| 469/469 [00:05<00:00, 82.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2974
Training Accuracy: 0.9171
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:02<00:00, 28.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2873
Testing accuracy: 0.9191
Best testing accuracy was: 0.9207
Stagnation was: 1

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.2934, Total Loss: 0.4334, Loss Parts: [0.4334]: 100%|███████████████████| 469/469 [00:05<00:00, 81.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2934
Training Accuracy: 0.9184
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2841
Testing accuracy: 0.9214
Best testing accuracy was: 0.9207
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.2903, Total Loss: 0.2195, Loss Parts: [0.2195]: 100%|███████████████████| 469/469 [00:05<00:00, 80.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2903
Training Accuracy: 0.9196
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2827
Testing accuracy: 0.9205
Best testing accuracy was: 0.9214
Stagnation was: 1

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.2876, Total Loss: 0.3786, Loss Parts: [0.3786]: 100%|███████████████████| 469/469 [00:05<00:00, 84.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2876
Training Accuracy: 0.9198
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2824
Testing accuracy: 0.9206
Best testing accuracy was: 0.9214
Stagnation was: 2

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.2850, Total Loss: 0.3143, Loss Parts: [0.3143]: 100%|███████████████████| 469/469 [00:05<00:00, 82.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2850
Training Accuracy: 0.9204
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2797
Testing accuracy: 0.9211
Best testing accuracy was: 0.9214
Stagnation was: 3

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.2829, Total Loss: 0.2194, Loss Parts: [0.2194]: 100%|███████████████████| 469/469 [00:05<00:00, 79.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2829
Training Accuracy: 0.9214
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2780
Testing accuracy: 0.9219
Best testing accuracy was: 0.9214
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.2811, Total Loss: 0.3934, Loss Parts: [0.3934]: 100%|███████████████████| 469/469 [00:05<00:00, 80.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2811
Training Accuracy: 0.9218
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2767
Testing accuracy: 0.9225
Best testing accuracy was: 0.9219
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.2793, Total Loss: 0.4273, Loss Parts: [0.4273]: 100%|███████████████████| 469/469 [00:05<00:00, 78.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2793
Training Accuracy: 0.9222
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2771
Testing accuracy: 0.9204
Best testing accuracy was: 0.9225
Stagnation was: 1

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.2774, Total Loss: 0.2677, Loss Parts: [0.2677]: 100%|███████████████████| 469/469 [00:05<00:00, 79.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2774
Training Accuracy: 0.9234
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2754
Testing accuracy: 0.9226
Best testing accuracy was: 0.9225
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.2760, Total Loss: 0.2777, Loss Parts: [0.2777]: 100%|███████████████████| 469/469 [00:05<00:00, 82.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2760
Training Accuracy: 0.9232
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2743
Testing accuracy: 0.9226
Best testing accuracy was: 0.9226
Stagnation was: 1

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.2751, Total Loss: 0.2666, Loss Parts: [0.2666]: 100%|███████████████████| 469/469 [00:05<00:00, 79.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2751
Training Accuracy: 0.9238
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2743
Testing accuracy: 0.9219
Best testing accuracy was: 0.9226
Stagnation was: 2

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.2737, Total Loss: 0.2433, Loss Parts: [0.2433]: 100%|███████████████████| 469/469 [00:06<00:00, 78.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2737
Training Accuracy: 0.9241
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2733
Testing accuracy: 0.9236
Best testing accuracy was: 0.9226
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.2725, Total Loss: 0.3353, Loss Parts: [0.3353]: 100%|███████████████████| 469/469 [00:05<00:00, 82.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2725
Training Accuracy: 0.9245
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.59it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2726
Testing accuracy: 0.9234
Best testing accuracy was: 0.9236
Stagnation was: 1

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.2716, Total Loss: 0.2850, Loss Parts: [0.2850]: 100%|███████████████████| 469/469 [00:05<00:00, 82.78it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2716
Training Accuracy: 0.9250
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2729
Testing accuracy: 0.9238
Best testing accuracy was: 0.9236
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.2707, Total Loss: 0.4798, Loss Parts: [0.4798]: 100%|███████████████████| 469/469 [00:05<00:00, 80.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2707
Training Accuracy: 0.9252
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.06it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2716
Testing accuracy: 0.9236
Best testing accuracy was: 0.9238
Stagnation was: 1

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.2695, Total Loss: 0.2479, Loss Parts: [0.2479]: 100%|███████████████████| 469/469 [00:05<00:00, 81.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2695
Training Accuracy: 0.9254
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2714
Testing accuracy: 0.9221
Best testing accuracy was: 0.9238
Stagnation was: 2

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.2688, Total Loss: 0.2560, Loss Parts: [0.2560]: 100%|███████████████████| 469/469 [00:05<00:00, 84.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2688
Training Accuracy: 0.9249
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2717
Testing accuracy: 0.9230
Best testing accuracy was: 0.9238
Stagnation was: 3

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.2677, Total Loss: 0.1260, Loss Parts: [0.1260]: 100%|███████████████████| 469/469 [00:05<00:00, 82.39it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2677
Training Accuracy: 0.9263
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2702
Testing accuracy: 0.9239
Best testing accuracy was: 0.9238
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.2671, Total Loss: 0.1703, Loss Parts: [0.1703]: 100%|███████████████████| 469/469 [00:05<00:00, 84.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2671
Training Accuracy: 0.9264
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2706
Testing accuracy: 0.9235
Best testing accuracy was: 0.9239
Stagnation was: 1

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.2663, Total Loss: 0.2335, Loss Parts: [0.2335]: 100%|███████████████████| 469/469 [00:06<00:00, 78.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2663
Training Accuracy: 0.9259
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2705
Testing accuracy: 0.9235
Best testing accuracy was: 0.9239
Stagnation was: 2

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.2656, Total Loss: 0.2073, Loss Parts: [0.2073]: 100%|███████████████████| 469/469 [00:05<00:00, 80.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2656
Training Accuracy: 0.9263
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2701
Testing accuracy: 0.9236
Best testing accuracy was: 0.9239
Stagnation was: 3

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.2650, Total Loss: 0.5496, Loss Parts: [0.5496]: 100%|███████████████████| 469/469 [00:05<00:00, 80.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2650
Training Accuracy: 0.9268
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2691
Testing accuracy: 0.9239
Best testing accuracy was: 0.9239
Stagnation was: 4

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.2642, Total Loss: 0.3086, Loss Parts: [0.3086]: 100%|███████████████████| 469/469 [00:06<00:00, 77.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2642
Training Accuracy: 0.9270
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.06it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2695
Testing accuracy: 0.9230
Best testing accuracy was: 0.9239
Ran out of patience at epoch: 29
Patience was: 5
Training complete in 4m 35s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\44b333e88741f6ef\sessions\Session 05-19-2021 04-50-46 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'tri

Avg. Loss: 0.6131, Total Loss: 0.3878, Loss Parts: [0.3878]: 100%|███████████████████| 469/469 [00:05<00:00, 87.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.6131
Training Accuracy: 0.8511
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.4233
Testing accuracy: 0.8963
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.4296, Total Loss: 0.3539, Loss Parts: [0.3539]: 100%|███████████████████| 469/469 [00:05<00:00, 82.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4296
Training Accuracy: 0.8930
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3988
Testing accuracy: 0.9013
Best testing accuracy was: 0.8963
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.4160, Total Loss: 0.3174, Loss Parts: [0.3174]: 100%|███████████████████| 469/469 [00:05<00:00, 83.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4160
Training Accuracy: 0.8968
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3918
Testing accuracy: 0.9045
Best testing accuracy was: 0.9013
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.4115, Total Loss: 0.3950, Loss Parts: [0.3950]: 100%|███████████████████| 469/469 [00:05<00:00, 82.78it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4115
Training Accuracy: 0.8982
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3950
Testing accuracy: 0.9047
Best testing accuracy was: 0.9045
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.4095, Total Loss: 0.4315, Loss Parts: [0.4315]: 100%|███████████████████| 469/469 [00:05<00:00, 80.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4095
Training Accuracy: 0.8993
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3898
Testing accuracy: 0.9065
Best testing accuracy was: 0.9047
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.4095, Total Loss: 0.3751, Loss Parts: [0.3751]: 100%|███████████████████| 469/469 [00:05<00:00, 82.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4095
Training Accuracy: 0.8993
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3894
Testing accuracy: 0.9078
Best testing accuracy was: 0.9065
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.4087, Total Loss: 0.5048, Loss Parts: [0.5048]: 100%|███████████████████| 469/469 [00:05<00:00, 79.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4087
Training Accuracy: 0.8988
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3907
Testing accuracy: 0.9072
Best testing accuracy was: 0.9078
Stagnation was: 1

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.4087, Total Loss: 0.3641, Loss Parts: [0.3641]: 100%|███████████████████| 469/469 [00:06<00:00, 78.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4087
Training Accuracy: 0.8995
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.19it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3909
Testing accuracy: 0.9048
Best testing accuracy was: 0.9078
Stagnation was: 2

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.4084, Total Loss: 0.4767, Loss Parts: [0.4767]: 100%|███████████████████| 469/469 [00:05<00:00, 81.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4084
Training Accuracy: 0.9000
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3905
Testing accuracy: 0.9065
Best testing accuracy was: 0.9078
Stagnation was: 3

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.4085, Total Loss: 0.4600, Loss Parts: [0.4600]: 100%|███████████████████| 469/469 [00:05<00:00, 85.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4085
Training Accuracy: 0.8993
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3888
Testing accuracy: 0.9069
Best testing accuracy was: 0.9078
Stagnation was: 4

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.4085, Total Loss: 0.3988, Loss Parts: [0.3988]: 100%|███████████████████| 469/469 [00:05<00:00, 80.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.4085
Training Accuracy: 0.8998
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3893
Testing accuracy: 0.9067
Best testing accuracy was: 0.9078
Ran out of patience at epoch: 10
Patience was: 5
Training complete in 1m 40s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\716119bb47f5a05c\sessions\Session 05-19-2021 04-52-26 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'tria

Avg. Loss: 0.8509, Total Loss: 0.8888, Loss Parts: [0.8888]: 100%|███████████████████| 469/469 [00:05<00:00, 84.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8509
Training Accuracy: 0.8341
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7474
Testing accuracy: 0.8703
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.7736, Total Loss: 0.6245, Loss Parts: [0.6245]: 100%|███████████████████| 469/469 [00:05<00:00, 83.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7736
Training Accuracy: 0.8574
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.03it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7497
Testing accuracy: 0.8683
Best testing accuracy was: 0.8703
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.8185, Loss Parts: [0.8185]: 100%|███████████████████| 469/469 [00:05<00:00, 82.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8580
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7443
Testing accuracy: 0.8686
Best testing accuracy was: 0.8703
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.7737, Total Loss: 0.6728, Loss Parts: [0.6728]: 100%|███████████████████| 469/469 [00:05<00:00, 83.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7737
Training Accuracy: 0.8578
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7445
Testing accuracy: 0.8686
Best testing accuracy was: 0.8703
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.7737, Total Loss: 0.7958, Loss Parts: [0.7958]: 100%|███████████████████| 469/469 [00:05<00:00, 83.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7737
Training Accuracy: 0.8573
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7471
Testing accuracy: 0.8636
Best testing accuracy was: 0.8703
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.7732, Total Loss: 0.8435, Loss Parts: [0.8435]: 100%|███████████████████| 469/469 [00:05<00:00, 81.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7732
Training Accuracy: 0.8573
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.20it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7490
Testing accuracy: 0.8697
Best testing accuracy was: 0.8703
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.7210, Loss Parts: [0.7210]: 100%|███████████████████| 469/469 [00:05<00:00, 82.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8571
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7459
Testing accuracy: 0.8727
Best testing accuracy was: 0.8703
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.7737, Total Loss: 0.8078, Loss Parts: [0.8078]: 100%|███████████████████| 469/469 [00:05<00:00, 82.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7737
Training Accuracy: 0.8577
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7469
Testing accuracy: 0.8651
Best testing accuracy was: 0.8727
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.8060, Loss Parts: [0.8060]: 100%|███████████████████| 469/469 [00:05<00:00, 79.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8583
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7459
Testing accuracy: 0.8732
Best testing accuracy was: 0.8727
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.7732, Total Loss: 0.7590, Loss Parts: [0.7590]: 100%|███████████████████| 469/469 [00:06<00:00, 76.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7732
Training Accuracy: 0.8578
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7473
Testing accuracy: 0.8662
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.7730, Total Loss: 0.7764, Loss Parts: [0.7764]: 100%|███████████████████| 469/469 [00:05<00:00, 85.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7730
Training Accuracy: 0.8583
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7460
Testing accuracy: 0.8671
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.7738, Total Loss: 0.6765, Loss Parts: [0.6765]: 100%|███████████████████| 469/469 [00:05<00:00, 80.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7738
Training Accuracy: 0.8580
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7463
Testing accuracy: 0.8667
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.7733, Total Loss: 0.7794, Loss Parts: [0.7794]: 100%|███████████████████| 469/469 [00:05<00:00, 82.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7733
Training Accuracy: 0.8587
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7471
Testing accuracy: 0.8683
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.7734, Total Loss: 0.7840, Loss Parts: [0.7840]: 100%|███████████████████| 469/469 [00:06<00:00, 77.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7734
Training Accuracy: 0.8578
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7507
Testing accuracy: 0.8674
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.7588, Loss Parts: [0.7588]: 100%|███████████████████| 469/469 [00:05<00:00, 81.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8577
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7451
Testing accuracy: 0.8700
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.7734, Total Loss: 0.7181, Loss Parts: [0.7181]: 100%|███████████████████| 469/469 [00:05<00:00, 83.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7734
Training Accuracy: 0.8582
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7471
Testing accuracy: 0.8676
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.6785, Loss Parts: [0.6785]: 100%|███████████████████| 469/469 [00:05<00:00, 84.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8576
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7448
Testing accuracy: 0.8733
Best testing accuracy was: 0.8732
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.7737, Total Loss: 0.7177, Loss Parts: [0.7177]: 100%|███████████████████| 469/469 [00:05<00:00, 80.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7737
Training Accuracy: 0.8575
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7484
Testing accuracy: 0.8733
Best testing accuracy was: 0.8733
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.7734, Total Loss: 0.8327, Loss Parts: [0.8327]: 100%|███████████████████| 469/469 [00:05<00:00, 86.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7734
Training Accuracy: 0.8571
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7472
Testing accuracy: 0.8686
Best testing accuracy was: 0.8733
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.7736, Total Loss: 0.7261, Loss Parts: [0.7261]: 100%|███████████████████| 469/469 [00:05<00:00, 84.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7736
Training Accuracy: 0.8577
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7500
Testing accuracy: 0.8631
Best testing accuracy was: 0.8733
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.7733, Total Loss: 0.7565, Loss Parts: [0.7565]: 100%|███████████████████| 469/469 [00:05<00:00, 85.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7733
Training Accuracy: 0.8571
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7514
Testing accuracy: 0.8772
Best testing accuracy was: 0.8733
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.7736, Total Loss: 0.8036, Loss Parts: [0.8036]: 100%|███████████████████| 469/469 [00:05<00:00, 82.82it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7736
Training Accuracy: 0.8578
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7495
Testing accuracy: 0.8696
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.7736, Total Loss: 0.6957, Loss Parts: [0.6957]: 100%|███████████████████| 469/469 [00:05<00:00, 82.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7736
Training Accuracy: 0.8571
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7495
Testing accuracy: 0.8714
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.8222, Loss Parts: [0.8222]: 100%|███████████████████| 469/469 [00:05<00:00, 79.99it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8575
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7517
Testing accuracy: 0.8743
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.7738, Total Loss: 0.7383, Loss Parts: [0.7383]: 100%|███████████████████| 469/469 [00:05<00:00, 86.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7738
Training Accuracy: 0.8570
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7421
Testing accuracy: 0.8731
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.7729, Total Loss: 0.7948, Loss Parts: [0.7948]: 100%|███████████████████| 469/469 [00:05<00:00, 83.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7729
Training Accuracy: 0.8589
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7463
Testing accuracy: 0.8677
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.7738, Total Loss: 0.8485, Loss Parts: [0.8485]: 100%|███████████████████| 469/469 [00:05<00:00, 80.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7738
Training Accuracy: 0.8576
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7445
Testing accuracy: 0.8673
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.7733, Total Loss: 0.7972, Loss Parts: [0.7972]: 100%|███████████████████| 469/469 [00:05<00:00, 81.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7733
Training Accuracy: 0.8576
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7457
Testing accuracy: 0.8644
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.7234, Loss Parts: [0.7234]: 100%|███████████████████| 469/469 [00:05<00:00, 84.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8570
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7477
Testing accuracy: 0.8637
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.6934, Loss Parts: [0.6934]: 100%|███████████████████| 469/469 [00:05<00:00, 79.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8578
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7492
Testing accuracy: 0.8611
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.7737, Total Loss: 0.7114, Loss Parts: [0.7114]: 100%|███████████████████| 469/469 [00:05<00:00, 84.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7737
Training Accuracy: 0.8572
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7489
Testing accuracy: 0.8672
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.6986, Loss Parts: [0.6986]: 100%|███████████████████| 469/469 [00:06<00:00, 78.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8579
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7454
Testing accuracy: 0.8680
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.7806, Loss Parts: [0.7806]: 100%|███████████████████| 469/469 [00:05<00:00, 84.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8583
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.00it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7507
Testing accuracy: 0.8622
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 0.7738, Total Loss: 0.6747, Loss Parts: [0.6747]: 100%|███████████████████| 469/469 [00:05<00:00, 83.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7738
Training Accuracy: 0.8581
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7475
Testing accuracy: 0.8716
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.8152, Loss Parts: [0.8152]: 100%|███████████████████| 469/469 [00:05<00:00, 79.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8578
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.21it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7486
Testing accuracy: 0.8654
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 0.7733, Total Loss: 0.8760, Loss Parts: [0.8760]: 100%|███████████████████| 469/469 [00:05<00:00, 84.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7733
Training Accuracy: 0.8576
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7497
Testing accuracy: 0.8692
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 0.7732, Total Loss: 0.8523, Loss Parts: [0.8523]: 100%|███████████████████| 469/469 [00:05<00:00, 80.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7732
Training Accuracy: 0.8581
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.30it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7467
Testing accuracy: 0.8700
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 0.7734, Total Loss: 0.7302, Loss Parts: [0.7302]: 100%|███████████████████| 469/469 [00:05<00:00, 85.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7734
Training Accuracy: 0.8586
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7468
Testing accuracy: 0.8631
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 0.7737, Total Loss: 0.7674, Loss Parts: [0.7674]: 100%|███████████████████| 469/469 [00:05<00:00, 83.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7737
Training Accuracy: 0.8567
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7478
Testing accuracy: 0.8673
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.7772, Loss Parts: [0.7772]: 100%|███████████████████| 469/469 [00:05<00:00, 82.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8569
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7496
Testing accuracy: 0.8722
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 0.7732, Total Loss: 0.7288, Loss Parts: [0.7288]: 100%|███████████████████| 469/469 [00:05<00:00, 80.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7732
Training Accuracy: 0.8574
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7506
Testing accuracy: 0.8727
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 0.7732, Total Loss: 0.6585, Loss Parts: [0.6585]: 100%|███████████████████| 469/469 [00:05<00:00, 83.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7732
Training Accuracy: 0.8583
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.57it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7468
Testing accuracy: 0.8680
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 0.7735, Total Loss: 0.7860, Loss Parts: [0.7860]: 100%|███████████████████| 469/469 [00:05<00:00, 82.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7735
Training Accuracy: 0.8579
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.31it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7457
Testing accuracy: 0.8714
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 0.7732, Total Loss: 0.8099, Loss Parts: [0.8099]: 100%|███████████████████| 469/469 [00:05<00:00, 81.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7732
Training Accuracy: 0.8577
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7470
Testing accuracy: 0.8691
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 0.7739, Total Loss: 0.7855, Loss Parts: [0.7855]: 100%|███████████████████| 469/469 [00:05<00:00, 79.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7739
Training Accuracy: 0.8583
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7413
Testing accuracy: 0.8707
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 0.7736, Total Loss: 0.8199, Loss Parts: [0.8199]: 100%|███████████████████| 469/469 [00:05<00:00, 82.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7736
Training Accuracy: 0.8575
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7463
Testing accuracy: 0.8683
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 0.7728, Total Loss: 0.7984, Loss Parts: [0.7984]: 100%|███████████████████| 469/469 [00:05<00:00, 84.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7728
Training Accuracy: 0.8581
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7544
Testing accuracy: 0.8697
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 0.7739, Total Loss: 0.7797, Loss Parts: [0.7797]: 100%|███████████████████| 469/469 [00:05<00:00, 85.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7739
Training Accuracy: 0.8571
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.38it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7460
Testing accuracy: 0.8703
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 0.7731, Total Loss: 0.6988, Loss Parts: [0.6988]: 100%|███████████████████| 469/469 [00:05<00:00, 86.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7731
Training Accuracy: 0.8577
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7492
Testing accuracy: 0.8663
Best testing accuracy was: 0.8772
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 0.7736, Total Loss: 1.0310, Loss Parts: [1.0310]: 100%|███████████████████| 469/469 [00:05<00:00, 80.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7736
Training Accuracy: 0.8579
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7482
Testing accuracy: 0.8604
Best testing accuracy was: 0.8772
Stagnation was: 0

Training complete in 7m 32s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\f3cfd582c9b9a972\sessions\Session 05-19-2021 04-59-59 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_index': 0}
----------
Epo

Avg. Loss: 0.6203, Total Loss: 0.3011, Loss Parts: [0.3011]: 100%|███████████████████| 469/469 [00:05<00:00, 83.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.6203
Training Accuracy: 0.8420
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3200
Testing accuracy: 0.9094
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.3024, Total Loss: 0.2662, Loss Parts: [0.2662]: 100%|███████████████████| 469/469 [00:05<00:00, 81.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3024
Training Accuracy: 0.9142
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2628
Testing accuracy: 0.9258
Best testing accuracy was: 0.9094
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.2544, Total Loss: 0.2596, Loss Parts: [0.2596]: 100%|███████████████████| 469/469 [00:05<00:00, 83.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2544
Training Accuracy: 0.9280
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2253
Testing accuracy: 0.9354
Best testing accuracy was: 0.9258
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.2174, Total Loss: 0.2120, Loss Parts: [0.2120]: 100%|███████████████████| 469/469 [00:05<00:00, 81.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2174
Training Accuracy: 0.9384
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1990
Testing accuracy: 0.9427
Best testing accuracy was: 0.9354
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.1896, Total Loss: 0.2114, Loss Parts: [0.2114]: 100%|███████████████████| 469/469 [00:05<00:00, 79.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1896
Training Accuracy: 0.9467
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1777
Testing accuracy: 0.9470
Best testing accuracy was: 0.9427
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.1669, Total Loss: 0.1532, Loss Parts: [0.1532]: 100%|███████████████████| 469/469 [00:05<00:00, 82.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1669
Training Accuracy: 0.9522
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.25it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1568
Testing accuracy: 0.9547
Best testing accuracy was: 0.9470
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.1488, Total Loss: 0.1147, Loss Parts: [0.1147]: 100%|███████████████████| 469/469 [00:06<00:00, 77.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1488
Training Accuracy: 0.9575
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.38it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1433
Testing accuracy: 0.9586
Best testing accuracy was: 0.9547
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.1342, Total Loss: 0.1700, Loss Parts: [0.1700]: 100%|███████████████████| 469/469 [00:05<00:00, 78.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1342
Training Accuracy: 0.9616
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1288
Testing accuracy: 0.9619
Best testing accuracy was: 0.9586
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.1221, Total Loss: 0.0950, Loss Parts: [0.0950]: 100%|███████████████████| 469/469 [00:05<00:00, 80.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1221
Training Accuracy: 0.9655
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.01it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1198
Testing accuracy: 0.9652
Best testing accuracy was: 0.9619
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.1118, Total Loss: 0.0722, Loss Parts: [0.0722]: 100%|███████████████████| 469/469 [00:05<00:00, 81.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1118
Training Accuracy: 0.9683
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1119
Testing accuracy: 0.9678
Best testing accuracy was: 0.9652
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.1034, Total Loss: 0.0833, Loss Parts: [0.0833]: 100%|███████████████████| 469/469 [00:06<00:00, 77.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1034
Training Accuracy: 0.9704
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1065
Testing accuracy: 0.9681
Best testing accuracy was: 0.9678
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.0955, Total Loss: 0.0828, Loss Parts: [0.0828]: 100%|███████████████████| 469/469 [00:06<00:00, 75.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0955
Training Accuracy: 0.9730
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.03it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1011
Testing accuracy: 0.9696
Best testing accuracy was: 0.9681
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.0895, Total Loss: 0.0839, Loss Parts: [0.0839]: 100%|███████████████████| 469/469 [00:05<00:00, 80.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0895
Training Accuracy: 0.9751
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0965
Testing accuracy: 0.9710
Best testing accuracy was: 0.9696
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.0834, Total Loss: 0.0396, Loss Parts: [0.0396]: 100%|███████████████████| 469/469 [00:06<00:00, 77.99it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0834
Training Accuracy: 0.9768
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0907
Testing accuracy: 0.9725
Best testing accuracy was: 0.9710
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.0782, Total Loss: 0.0808, Loss Parts: [0.0808]: 100%|███████████████████| 469/469 [00:06<00:00, 77.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0782
Training Accuracy: 0.9782
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0887
Testing accuracy: 0.9725
Best testing accuracy was: 0.9725
Stagnation was: 1

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.0737, Total Loss: 0.0362, Loss Parts: [0.0362]: 100%|███████████████████| 469/469 [00:06<00:00, 77.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0737
Training Accuracy: 0.9796
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0851
Testing accuracy: 0.9746
Best testing accuracy was: 0.9725
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.0697, Total Loss: 0.0394, Loss Parts: [0.0394]: 100%|███████████████████| 469/469 [00:05<00:00, 80.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0697
Training Accuracy: 0.9809
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0838
Testing accuracy: 0.9744
Best testing accuracy was: 0.9746
Stagnation was: 1

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.0661, Total Loss: 0.0243, Loss Parts: [0.0243]: 100%|███████████████████| 469/469 [00:06<00:00, 77.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0661
Training Accuracy: 0.9820
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0793
Testing accuracy: 0.9760
Best testing accuracy was: 0.9746
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.0628, Total Loss: 0.0388, Loss Parts: [0.0388]: 100%|███████████████████| 469/469 [00:06<00:00, 77.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0628
Training Accuracy: 0.9829
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0791
Testing accuracy: 0.9757
Best testing accuracy was: 0.9760
Stagnation was: 1

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.0594, Total Loss: 0.0407, Loss Parts: [0.0407]: 100%|███████████████████| 469/469 [00:05<00:00, 80.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0594
Training Accuracy: 0.9841
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.59it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0762
Testing accuracy: 0.9765
Best testing accuracy was: 0.9760
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.0565, Total Loss: 0.0671, Loss Parts: [0.0671]: 100%|███████████████████| 469/469 [00:05<00:00, 81.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0565
Training Accuracy: 0.9850
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0761
Testing accuracy: 0.9768
Best testing accuracy was: 0.9765
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.0539, Total Loss: 0.0338, Loss Parts: [0.0338]: 100%|███████████████████| 469/469 [00:05<00:00, 82.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0539
Training Accuracy: 0.9855
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0753
Testing accuracy: 0.9775
Best testing accuracy was: 0.9768
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.0515, Total Loss: 0.0266, Loss Parts: [0.0266]: 100%|███████████████████| 469/469 [00:05<00:00, 82.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0515
Training Accuracy: 0.9863
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0729
Testing accuracy: 0.9776
Best testing accuracy was: 0.9775
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.0495, Total Loss: 0.0184, Loss Parts: [0.0184]: 100%|███████████████████| 469/469 [00:06<00:00, 78.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0495
Training Accuracy: 0.9869
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0718
Testing accuracy: 0.9781
Best testing accuracy was: 0.9776
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.0474, Total Loss: 0.0407, Loss Parts: [0.0407]: 100%|███████████████████| 469/469 [00:05<00:00, 82.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0474
Training Accuracy: 0.9874
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0711
Testing accuracy: 0.9781
Best testing accuracy was: 0.9781
Stagnation was: 1

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.0450, Total Loss: 0.0567, Loss Parts: [0.0567]: 100%|███████████████████| 469/469 [00:05<00:00, 83.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0450
Training Accuracy: 0.9883
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0686
Testing accuracy: 0.9791
Best testing accuracy was: 0.9781
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.0433, Total Loss: 0.0445, Loss Parts: [0.0445]: 100%|███████████████████| 469/469 [00:05<00:00, 81.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0433
Training Accuracy: 0.9889
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0703
Testing accuracy: 0.9789
Best testing accuracy was: 0.9791
Stagnation was: 1

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.0416, Total Loss: 0.1263, Loss Parts: [0.1263]: 100%|███████████████████| 469/469 [00:05<00:00, 80.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0416
Training Accuracy: 0.9890
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.30it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0684
Testing accuracy: 0.9788
Best testing accuracy was: 0.9791
Stagnation was: 2

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.0400, Total Loss: 0.0328, Loss Parts: [0.0328]: 100%|███████████████████| 469/469 [00:05<00:00, 79.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0400
Training Accuracy: 0.9900
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0683
Testing accuracy: 0.9791
Best testing accuracy was: 0.9791
Stagnation was: 3

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.0384, Total Loss: 0.0252, Loss Parts: [0.0252]: 100%|███████████████████| 469/469 [00:05<00:00, 80.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0384
Training Accuracy: 0.9905
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0686
Testing accuracy: 0.9797
Best testing accuracy was: 0.9791
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.0368, Total Loss: 0.0178, Loss Parts: [0.0178]: 100%|███████████████████| 469/469 [00:05<00:00, 81.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0368
Training Accuracy: 0.9907
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0686
Testing accuracy: 0.9796
Best testing accuracy was: 0.9797
Stagnation was: 1

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.0358, Total Loss: 0.0168, Loss Parts: [0.0168]: 100%|███████████████████| 469/469 [00:05<00:00, 84.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0358
Training Accuracy: 0.9911
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0673
Testing accuracy: 0.9797
Best testing accuracy was: 0.9797
Stagnation was: 2

----------
Epoch 33/50
----------
Training


Avg. Loss: 0.0343, Total Loss: 0.0813, Loss Parts: [0.0813]: 100%|███████████████████| 469/469 [00:05<00:00, 79.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0343
Training Accuracy: 0.9914
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0666
Testing accuracy: 0.9797
Best testing accuracy was: 0.9797
Stagnation was: 3

----------
Epoch 34/50
----------
Training


Avg. Loss: 0.0332, Total Loss: 0.0321, Loss Parts: [0.0321]: 100%|███████████████████| 469/469 [00:06<00:00, 77.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0332
Training Accuracy: 0.9919
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0652
Testing accuracy: 0.9801
Best testing accuracy was: 0.9797
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 0.0320, Total Loss: 0.0364, Loss Parts: [0.0364]: 100%|███████████████████| 469/469 [00:05<00:00, 78.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0320
Training Accuracy: 0.9923
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0658
Testing accuracy: 0.9795
Best testing accuracy was: 0.9801
Stagnation was: 1

----------
Epoch 36/50
----------
Training


Avg. Loss: 0.0306, Total Loss: 0.0382, Loss Parts: [0.0382]: 100%|███████████████████| 469/469 [00:05<00:00, 83.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0306
Training Accuracy: 0.9926
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0649
Testing accuracy: 0.9804
Best testing accuracy was: 0.9801
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 0.0294, Total Loss: 0.0174, Loss Parts: [0.0174]: 100%|███████████████████| 469/469 [00:05<00:00, 80.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0294
Training Accuracy: 0.9933
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0649
Testing accuracy: 0.9802
Best testing accuracy was: 0.9804
Stagnation was: 1

----------
Epoch 38/50
----------
Training


Avg. Loss: 0.0285, Total Loss: 0.0325, Loss Parts: [0.0325]: 100%|███████████████████| 469/469 [00:05<00:00, 80.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0285
Training Accuracy: 0.9935
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.30it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0651
Testing accuracy: 0.9796
Best testing accuracy was: 0.9804
Stagnation was: 2

----------
Epoch 39/50
----------
Training


Avg. Loss: 0.0276, Total Loss: 0.0231, Loss Parts: [0.0231]: 100%|███████████████████| 469/469 [00:06<00:00, 76.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0276
Training Accuracy: 0.9939
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0653
Testing accuracy: 0.9803
Best testing accuracy was: 0.9804
Stagnation was: 3

----------
Epoch 40/50
----------
Training


Avg. Loss: 0.0265, Total Loss: 0.0214, Loss Parts: [0.0214]: 100%|███████████████████| 469/469 [00:05<00:00, 80.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0265
Training Accuracy: 0.9940
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0647
Testing accuracy: 0.9798
Best testing accuracy was: 0.9804
Stagnation was: 4

----------
Epoch 41/50
----------
Training


Avg. Loss: 0.0257, Total Loss: 0.0135, Loss Parts: [0.0135]: 100%|███████████████████| 469/469 [00:05<00:00, 81.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0257
Training Accuracy: 0.9942
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0644
Testing accuracy: 0.9807
Best testing accuracy was: 0.9804
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 0.0248, Total Loss: 0.0230, Loss Parts: [0.0230]: 100%|███████████████████| 469/469 [00:06<00:00, 76.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0248
Training Accuracy: 0.9944
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.20it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0650
Testing accuracy: 0.9801
Best testing accuracy was: 0.9807
Stagnation was: 1

----------
Epoch 43/50
----------
Training


Avg. Loss: 0.0241, Total Loss: 0.0229, Loss Parts: [0.0229]: 100%|███████████████████| 469/469 [00:06<00:00, 76.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0241
Training Accuracy: 0.9948
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.59it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0639
Testing accuracy: 0.9800
Best testing accuracy was: 0.9807
Stagnation was: 2

----------
Epoch 44/50
----------
Training


Avg. Loss: 0.0234, Total Loss: 0.0187, Loss Parts: [0.0187]: 100%|███████████████████| 469/469 [00:05<00:00, 78.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0234
Training Accuracy: 0.9951
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0651
Testing accuracy: 0.9805
Best testing accuracy was: 0.9807
Stagnation was: 3

----------
Epoch 45/50
----------
Training


Avg. Loss: 0.0225, Total Loss: 0.0223, Loss Parts: [0.0223]: 100%|███████████████████| 469/469 [00:05<00:00, 84.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0225
Training Accuracy: 0.9956
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0639
Testing accuracy: 0.9808
Best testing accuracy was: 0.9807
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 0.0217, Total Loss: 0.0521, Loss Parts: [0.0521]: 100%|███████████████████| 469/469 [00:05<00:00, 80.99it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0217
Training Accuracy: 0.9957
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0636
Testing accuracy: 0.9808
Best testing accuracy was: 0.9808
Stagnation was: 1

----------
Epoch 47/50
----------
Training


Avg. Loss: 0.0210, Total Loss: 0.0063, Loss Parts: [0.0063]: 100%|███████████████████| 469/469 [00:06<00:00, 77.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0210
Training Accuracy: 0.9960
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.01it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0651
Testing accuracy: 0.9803
Best testing accuracy was: 0.9808
Stagnation was: 2

----------
Epoch 48/50
----------
Training


Avg. Loss: 0.0203, Total Loss: 0.0101, Loss Parts: [0.0101]: 100%|███████████████████| 469/469 [00:06<00:00, 77.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0203
Training Accuracy: 0.9964
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0639
Testing accuracy: 0.9805
Best testing accuracy was: 0.9808
Stagnation was: 3

----------
Epoch 49/50
----------
Training


Avg. Loss: 0.0197, Total Loss: 0.0054, Loss Parts: [0.0054]: 100%|███████████████████| 469/469 [00:05<00:00, 80.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0197
Training Accuracy: 0.9966
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.25it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0675
Testing accuracy: 0.9795
Best testing accuracy was: 0.9808
Stagnation was: 4

----------
Epoch 50/50
----------
Training


Avg. Loss: 0.0190, Total Loss: 0.0145, Loss Parts: [0.0145]: 100%|███████████████████| 469/469 [00:05<00:00, 84.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0190
Training Accuracy: 0.9968
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0650
Testing accuracy: 0.9800
Best testing accuracy was: 0.9808
Ran out of patience at epoch: 49
Patience was: 5
Training complete in 7m 43s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\f88dac12158f7350\sessions\Session 05-19-2021 05-07-41 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, '

Avg. Loss: 0.6617, Total Loss: 0.4070, Loss Parts: [0.4070]: 100%|███████████████████| 469/469 [00:05<00:00, 86.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.6617
Training Accuracy: 0.8317
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3638
Testing accuracy: 0.9054
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.3530, Total Loss: 0.3353, Loss Parts: [0.3353]: 100%|███████████████████| 469/469 [00:05<00:00, 80.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3530
Training Accuracy: 0.9073
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3259
Testing accuracy: 0.9151
Best testing accuracy was: 0.9054
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.3257, Total Loss: 0.2674, Loss Parts: [0.2674]: 100%|███████████████████| 469/469 [00:05<00:00, 78.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3257
Training Accuracy: 0.9170
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3045
Testing accuracy: 0.9240
Best testing accuracy was: 0.9151
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.3098, Total Loss: 0.3283, Loss Parts: [0.3283]: 100%|███████████████████| 469/469 [00:05<00:00, 81.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3098
Training Accuracy: 0.9206
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.57it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2929
Testing accuracy: 0.9281
Best testing accuracy was: 0.9240
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.2994, Total Loss: 0.2858, Loss Parts: [0.2858]: 100%|███████████████████| 469/469 [00:05<00:00, 81.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2994
Training Accuracy: 0.9247
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2821
Testing accuracy: 0.9289
Best testing accuracy was: 0.9281
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.2923, Total Loss: 0.2323, Loss Parts: [0.2323]: 100%|███████████████████| 469/469 [00:05<00:00, 80.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2923
Training Accuracy: 0.9272
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2788
Testing accuracy: 0.9297
Best testing accuracy was: 0.9289
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.2871, Total Loss: 0.3748, Loss Parts: [0.3748]: 100%|███████████████████| 469/469 [00:05<00:00, 83.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2871
Training Accuracy: 0.9290
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.00it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2709
Testing accuracy: 0.9335
Best testing accuracy was: 0.9297
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.2827, Total Loss: 0.2042, Loss Parts: [0.2042]: 100%|███████████████████| 469/469 [00:05<00:00, 81.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2827
Training Accuracy: 0.9298
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2698
Testing accuracy: 0.9338
Best testing accuracy was: 0.9335
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.2808, Total Loss: 0.3329, Loss Parts: [0.3329]: 100%|███████████████████| 469/469 [00:05<00:00, 81.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2808
Training Accuracy: 0.9307
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2700
Testing accuracy: 0.9340
Best testing accuracy was: 0.9338
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.2777, Total Loss: 0.2361, Loss Parts: [0.2361]: 100%|███████████████████| 469/469 [00:05<00:00, 81.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2777
Training Accuracy: 0.9322
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2632
Testing accuracy: 0.9356
Best testing accuracy was: 0.9340
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.2750, Total Loss: 0.2609, Loss Parts: [0.2609]: 100%|███████████████████| 469/469 [00:06<00:00, 77.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2750
Training Accuracy: 0.9334
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2614
Testing accuracy: 0.9371
Best testing accuracy was: 0.9356
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.2734, Total Loss: 0.1886, Loss Parts: [0.1886]: 100%|███████████████████| 469/469 [00:06<00:00, 76.62it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2734
Training Accuracy: 0.9344
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2629
Testing accuracy: 0.9349
Best testing accuracy was: 0.9371
Stagnation was: 1

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.2723, Total Loss: 0.2543, Loss Parts: [0.2543]: 100%|███████████████████| 469/469 [00:06<00:00, 77.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2723
Training Accuracy: 0.9336
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2603
Testing accuracy: 0.9368
Best testing accuracy was: 0.9371
Stagnation was: 2

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.2701, Total Loss: 0.2470, Loss Parts: [0.2470]: 100%|███████████████████| 469/469 [00:06<00:00, 78.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2701
Training Accuracy: 0.9349
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2613
Testing accuracy: 0.9361
Best testing accuracy was: 0.9371
Stagnation was: 3

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.2695, Total Loss: 0.2553, Loss Parts: [0.2553]: 100%|███████████████████| 469/469 [00:06<00:00, 77.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2695
Training Accuracy: 0.9346
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2598
Testing accuracy: 0.9383
Best testing accuracy was: 0.9371
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.2684, Total Loss: 0.2716, Loss Parts: [0.2716]: 100%|███████████████████| 469/469 [00:06<00:00, 77.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2684
Training Accuracy: 0.9352
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2593
Testing accuracy: 0.9354
Best testing accuracy was: 0.9383
Stagnation was: 1

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.2674, Total Loss: 0.2884, Loss Parts: [0.2884]: 100%|███████████████████| 469/469 [00:06<00:00, 77.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2674
Training Accuracy: 0.9357
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2575
Testing accuracy: 0.9374
Best testing accuracy was: 0.9383
Stagnation was: 2

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.2660, Total Loss: 0.3057, Loss Parts: [0.3057]: 100%|███████████████████| 469/469 [00:05<00:00, 80.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2660
Training Accuracy: 0.9366
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2548
Testing accuracy: 0.9380
Best testing accuracy was: 0.9383
Stagnation was: 3

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.2656, Total Loss: 0.3020, Loss Parts: [0.3020]: 100%|███████████████████| 469/469 [00:05<00:00, 79.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2656
Training Accuracy: 0.9361
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2542
Testing accuracy: 0.9385
Best testing accuracy was: 0.9383
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.2648, Total Loss: 0.2551, Loss Parts: [0.2551]: 100%|███████████████████| 469/469 [00:06<00:00, 77.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2648
Training Accuracy: 0.9364
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2542
Testing accuracy: 0.9381
Best testing accuracy was: 0.9385
Stagnation was: 1

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.2642, Total Loss: 0.2794, Loss Parts: [0.2794]: 100%|███████████████████| 469/469 [00:06<00:00, 78.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2642
Training Accuracy: 0.9368
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2537
Testing accuracy: 0.9384
Best testing accuracy was: 0.9385
Stagnation was: 2

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.2630, Total Loss: 0.3881, Loss Parts: [0.3881]: 100%|███████████████████| 469/469 [00:05<00:00, 79.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2630
Training Accuracy: 0.9373
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2505
Testing accuracy: 0.9407
Best testing accuracy was: 0.9385
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.2632, Total Loss: 0.3043, Loss Parts: [0.3043]: 100%|███████████████████| 469/469 [00:05<00:00, 83.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2632
Training Accuracy: 0.9373
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2534
Testing accuracy: 0.9381
Best testing accuracy was: 0.9407
Stagnation was: 1

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.2627, Total Loss: 0.3378, Loss Parts: [0.3378]: 100%|███████████████████| 469/469 [00:06<00:00, 74.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2627
Training Accuracy: 0.9374
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2506
Testing accuracy: 0.9410
Best testing accuracy was: 0.9407
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.2618, Total Loss: 0.2636, Loss Parts: [0.2636]: 100%|███████████████████| 469/469 [00:06<00:00, 77.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2618
Training Accuracy: 0.9380
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2502
Testing accuracy: 0.9397
Best testing accuracy was: 0.9410
Stagnation was: 1

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.2614, Total Loss: 0.3168, Loss Parts: [0.3168]: 100%|███████████████████| 469/469 [00:05<00:00, 78.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2614
Training Accuracy: 0.9377
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2500
Testing accuracy: 0.9404
Best testing accuracy was: 0.9410
Stagnation was: 2

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.2610, Total Loss: 0.3024, Loss Parts: [0.3024]: 100%|███████████████████| 469/469 [00:05<00:00, 80.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2610
Training Accuracy: 0.9382
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2514
Testing accuracy: 0.9393
Best testing accuracy was: 0.9410
Stagnation was: 3

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.2614, Total Loss: 0.3263, Loss Parts: [0.3263]: 100%|███████████████████| 469/469 [00:05<00:00, 78.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2614
Training Accuracy: 0.9380
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2499
Testing accuracy: 0.9391
Best testing accuracy was: 0.9410
Stagnation was: 4

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.2610, Total Loss: 0.3723, Loss Parts: [0.3723]: 100%|███████████████████| 469/469 [00:05<00:00, 79.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2610
Training Accuracy: 0.9380
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2503
Testing accuracy: 0.9410
Best testing accuracy was: 0.9410
Ran out of patience at epoch: 28
Patience was: 5
Training complete in 4m 31s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\0b050f3f6a14b9bf\sessions\Session 05-19-2021 05-12-12 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 't

Avg. Loss: 1.0595, Total Loss: 0.9719, Loss Parts: [0.9719]: 100%|███████████████████| 469/469 [00:05<00:00, 84.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0595
Training Accuracy: 0.7835
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8334
Testing accuracy: 0.8480
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.8544, Total Loss: 0.8586, Loss Parts: [0.8586]: 100%|███████████████████| 469/469 [00:05<00:00, 84.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8544
Training Accuracy: 0.8444
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8252
Testing accuracy: 0.8603
Best testing accuracy was: 0.8480
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.8506, Total Loss: 0.7453, Loss Parts: [0.7453]: 100%|███████████████████| 469/469 [00:05<00:00, 80.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8506
Training Accuracy: 0.8444
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8324
Testing accuracy: 0.8475
Best testing accuracy was: 0.8603
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.8495, Total Loss: 0.8688, Loss Parts: [0.8688]: 100%|███████████████████| 469/469 [00:06<00:00, 76.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8495
Training Accuracy: 0.8451
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8272
Testing accuracy: 0.8606
Best testing accuracy was: 0.8603
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.8486, Total Loss: 0.8839, Loss Parts: [0.8839]: 100%|███████████████████| 469/469 [00:06<00:00, 75.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8486
Training Accuracy: 0.8460
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8299
Testing accuracy: 0.8450
Best testing accuracy was: 0.8606
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.8476, Total Loss: 0.8390, Loss Parts: [0.8390]: 100%|███████████████████| 469/469 [00:05<00:00, 83.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8476
Training Accuracy: 0.8476
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.57it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8209
Testing accuracy: 0.8617
Best testing accuracy was: 0.8606
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.8470, Total Loss: 0.8614, Loss Parts: [0.8614]: 100%|███████████████████| 469/469 [00:05<00:00, 81.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8470
Training Accuracy: 0.8443
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8300
Testing accuracy: 0.8456
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.8462, Total Loss: 0.9061, Loss Parts: [0.9061]: 100%|███████████████████| 469/469 [00:06<00:00, 76.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8462
Training Accuracy: 0.8460
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8301
Testing accuracy: 0.8524
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.8470, Total Loss: 0.8593, Loss Parts: [0.8593]: 100%|███████████████████| 469/469 [00:06<00:00, 75.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8470
Training Accuracy: 0.8466
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8226
Testing accuracy: 0.8560
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.8453, Total Loss: 0.8466, Loss Parts: [0.8466]: 100%|███████████████████| 469/469 [00:05<00:00, 78.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8453
Training Accuracy: 0.8478
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8243
Testing accuracy: 0.8591
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.8464, Total Loss: 0.8339, Loss Parts: [0.8339]: 100%|███████████████████| 469/469 [00:05<00:00, 84.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8464
Training Accuracy: 0.8464
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8250
Testing accuracy: 0.8528
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.8466, Total Loss: 0.7751, Loss Parts: [0.7751]: 100%|███████████████████| 469/469 [00:05<00:00, 79.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8466
Training Accuracy: 0.8456
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8245
Testing accuracy: 0.8550
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.8460, Total Loss: 0.7871, Loss Parts: [0.7871]: 100%|███████████████████| 469/469 [00:05<00:00, 79.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8460
Training Accuracy: 0.8474
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.65it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8254
Testing accuracy: 0.8543
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.8455, Total Loss: 0.7982, Loss Parts: [0.7982]: 100%|███████████████████| 469/469 [00:05<00:00, 78.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8455
Training Accuracy: 0.8484
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8265
Testing accuracy: 0.8585
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.8473, Total Loss: 0.8030, Loss Parts: [0.8030]: 100%|███████████████████| 469/469 [00:06<00:00, 76.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8473
Training Accuracy: 0.8451
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8233
Testing accuracy: 0.8508
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.8448, Total Loss: 0.8334, Loss Parts: [0.8334]: 100%|███████████████████| 469/469 [00:06<00:00, 75.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8448
Training Accuracy: 0.8469
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8300
Testing accuracy: 0.8626
Best testing accuracy was: 0.8617
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.8470, Total Loss: 0.8340, Loss Parts: [0.8340]: 100%|███████████████████| 469/469 [00:06<00:00, 73.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8470
Training Accuracy: 0.8469
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8225
Testing accuracy: 0.8630
Best testing accuracy was: 0.8626
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.8464, Total Loss: 0.7808, Loss Parts: [0.7808]: 100%|███████████████████| 469/469 [00:06<00:00, 74.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8464
Training Accuracy: 0.8462
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8221
Testing accuracy: 0.8512
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.8450, Total Loss: 0.8922, Loss Parts: [0.8922]: 100%|███████████████████| 469/469 [00:05<00:00, 78.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8450
Training Accuracy: 0.8486
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8288
Testing accuracy: 0.8428
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.8451, Total Loss: 0.7847, Loss Parts: [0.7847]: 100%|███████████████████| 469/469 [00:06<00:00, 78.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8451
Training Accuracy: 0.8481
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8259
Testing accuracy: 0.8500
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.8462, Total Loss: 0.7780, Loss Parts: [0.7780]: 100%|███████████████████| 469/469 [00:06<00:00, 75.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8462
Training Accuracy: 0.8447
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.30it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8270
Testing accuracy: 0.8549
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.8503, Loss Parts: [0.8503]: 100%|███████████████████| 469/469 [00:05<00:00, 83.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8470
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8248
Testing accuracy: 0.8529
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.8456, Total Loss: 0.8076, Loss Parts: [0.8076]: 100%|███████████████████| 469/469 [00:06<00:00, 77.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8456
Training Accuracy: 0.8466
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8256
Testing accuracy: 0.8505
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.8451, Total Loss: 0.9040, Loss Parts: [0.9040]: 100%|███████████████████| 469/469 [00:05<00:00, 78.39it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8451
Training Accuracy: 0.8478
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8274
Testing accuracy: 0.8325
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.8462, Total Loss: 0.8563, Loss Parts: [0.8563]: 100%|███████████████████| 469/469 [00:05<00:00, 78.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8462
Training Accuracy: 0.8453
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.22it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8230
Testing accuracy: 0.8570
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.8226, Loss Parts: [0.8226]: 100%|███████████████████| 469/469 [00:05<00:00, 81.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8459
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8219
Testing accuracy: 0.8622
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.8306, Loss Parts: [0.8306]: 100%|███████████████████| 469/469 [00:05<00:00, 81.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8466
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8255
Testing accuracy: 0.8503
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.8452, Total Loss: 0.8526, Loss Parts: [0.8526]: 100%|███████████████████| 469/469 [00:05<00:00, 82.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8452
Training Accuracy: 0.8481
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8181
Testing accuracy: 0.8563
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.8461, Total Loss: 0.8587, Loss Parts: [0.8587]: 100%|███████████████████| 469/469 [00:05<00:00, 81.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8461
Training Accuracy: 0.8466
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.21it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8212
Testing accuracy: 0.8618
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.8443, Total Loss: 0.9922, Loss Parts: [0.9922]: 100%|███████████████████| 469/469 [00:06<00:00, 77.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8443
Training Accuracy: 0.8473
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8241
Testing accuracy: 0.8563
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.8456, Total Loss: 0.8512, Loss Parts: [0.8512]: 100%|███████████████████| 469/469 [00:05<00:00, 80.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8456
Training Accuracy: 0.8470
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8208
Testing accuracy: 0.8596
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.8460, Total Loss: 0.8271, Loss Parts: [0.8271]: 100%|███████████████████| 469/469 [00:05<00:00, 80.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8460
Training Accuracy: 0.8467
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8186
Testing accuracy: 0.8587
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 0.8444, Total Loss: 0.8757, Loss Parts: [0.8757]: 100%|███████████████████| 469/469 [00:05<00:00, 82.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8444
Training Accuracy: 0.8471
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8340
Testing accuracy: 0.8577
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.8027, Loss Parts: [0.8027]: 100%|███████████████████| 469/469 [00:06<00:00, 74.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8451
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8222
Testing accuracy: 0.8655
Best testing accuracy was: 0.8630
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 0.8460, Total Loss: 0.8973, Loss Parts: [0.8973]: 100%|███████████████████| 469/469 [00:05<00:00, 80.57it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8460
Training Accuracy: 0.8473
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:02<00:00, 26.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8210
Testing accuracy: 0.8516
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 0.8445, Total Loss: 0.8725, Loss Parts: [0.8725]: 100%|███████████████████| 469/469 [00:05<00:00, 79.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8445
Training Accuracy: 0.8472
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8210
Testing accuracy: 0.8581
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 0.8449, Total Loss: 0.8433, Loss Parts: [0.8433]: 100%|███████████████████| 469/469 [00:05<00:00, 80.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8449
Training Accuracy: 0.8471
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8249
Testing accuracy: 0.8553
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.8572, Loss Parts: [0.8572]: 100%|███████████████████| 469/469 [00:06<00:00, 72.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8470
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8292
Testing accuracy: 0.8562
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 0.8440, Total Loss: 0.7957, Loss Parts: [0.7957]: 100%|███████████████████| 469/469 [00:06<00:00, 74.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8440
Training Accuracy: 0.8479
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8353
Testing accuracy: 0.8570
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.8133, Loss Parts: [0.8133]: 100%|███████████████████| 469/469 [00:06<00:00, 77.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8469
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8218
Testing accuracy: 0.8626
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 0.8453, Total Loss: 0.9194, Loss Parts: [0.9194]: 100%|███████████████████| 469/469 [00:06<00:00, 77.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8453
Training Accuracy: 0.8463
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8223
Testing accuracy: 0.8538
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 0.8459, Total Loss: 0.7626, Loss Parts: [0.7626]: 100%|███████████████████| 469/469 [00:06<00:00, 77.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8459
Training Accuracy: 0.8464
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8217
Testing accuracy: 0.8586
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 0.8459, Total Loss: 0.8747, Loss Parts: [0.8747]: 100%|███████████████████| 469/469 [00:06<00:00, 77.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8459
Training Accuracy: 0.8463
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8259
Testing accuracy: 0.8588
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 0.8447, Total Loss: 0.9705, Loss Parts: [0.9705]: 100%|███████████████████| 469/469 [00:06<00:00, 75.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8447
Training Accuracy: 0.8467
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8263
Testing accuracy: 0.8558
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 0.8457, Total Loss: 0.7958, Loss Parts: [0.7958]: 100%|███████████████████| 469/469 [00:06<00:00, 74.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8457
Training Accuracy: 0.8472
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.65it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8224
Testing accuracy: 0.8482
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 0.8453, Total Loss: 0.9210, Loss Parts: [0.9210]: 100%|███████████████████| 469/469 [00:05<00:00, 78.31it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8453
Training Accuracy: 0.8458
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8160
Testing accuracy: 0.8602
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 0.8444, Total Loss: 0.7560, Loss Parts: [0.7560]: 100%|███████████████████| 469/469 [00:05<00:00, 79.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8444
Training Accuracy: 0.8477
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8198
Testing accuracy: 0.8508
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 0.8452, Total Loss: 0.8829, Loss Parts: [0.8829]: 100%|███████████████████| 469/469 [00:05<00:00, 84.31it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8452
Training Accuracy: 0.8469
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8230
Testing accuracy: 0.8652
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 0.8460, Total Loss: 0.7958, Loss Parts: [0.7958]: 100%|███████████████████| 469/469 [00:06<00:00, 76.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8460
Training Accuracy: 0.8459
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8248
Testing accuracy: 0.8570
Best testing accuracy was: 0.8655
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 0.8465, Total Loss: 0.8972, Loss Parts: [0.8972]: 100%|███████████████████| 469/469 [00:05<00:00, 78.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8465
Training Accuracy: 0.8463
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.8223
Testing accuracy: 0.8540
Best testing accuracy was: 0.8655
Stagnation was: 0

Training complete in 7m 47s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\ca1694869d61b24a\sessions\Session 05-19-2021 05-19-59 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_index': 0}
---------

Avg. Loss: 0.7716, Total Loss: 0.1823, Loss Parts: [0.1823]: 100%|███████████████████| 469/469 [00:05<00:00, 81.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.7716
Training Accuracy: 0.7881
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3115
Testing accuracy: 0.9124
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.2826, Total Loss: 0.2748, Loss Parts: [0.2748]: 100%|███████████████████| 469/469 [00:06<00:00, 76.99it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2826
Training Accuracy: 0.9180
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2323
Testing accuracy: 0.9339
Best testing accuracy was: 0.9124
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.2173, Total Loss: 0.2451, Loss Parts: [0.2451]: 100%|███████████████████| 469/469 [00:06<00:00, 77.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2173
Training Accuracy: 0.9367
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1920
Testing accuracy: 0.9450
Best testing accuracy was: 0.9339
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.1740, Total Loss: 0.1371, Loss Parts: [0.1371]: 100%|███████████████████| 469/469 [00:06<00:00, 76.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1740
Training Accuracy: 0.9494
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1588
Testing accuracy: 0.9526
Best testing accuracy was: 0.9450
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.1446, Total Loss: 0.1659, Loss Parts: [0.1659]: 100%|███████████████████| 469/469 [00:06<00:00, 75.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1446
Training Accuracy: 0.9583
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1321
Testing accuracy: 0.9607
Best testing accuracy was: 0.9526
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.1210, Total Loss: 0.1933, Loss Parts: [0.1933]: 100%|███████████████████| 469/469 [00:06<00:00, 74.68it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1210
Training Accuracy: 0.9648
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1188
Testing accuracy: 0.9652
Best testing accuracy was: 0.9607
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.1059, Total Loss: 0.0493, Loss Parts: [0.0493]: 100%|███████████████████| 469/469 [00:05<00:00, 78.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1059
Training Accuracy: 0.9688
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1076
Testing accuracy: 0.9688
Best testing accuracy was: 0.9652
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.0943, Total Loss: 0.1274, Loss Parts: [0.1274]: 100%|███████████████████| 469/469 [00:06<00:00, 73.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0943
Training Accuracy: 0.9721
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1008
Testing accuracy: 0.9705
Best testing accuracy was: 0.9688
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.0839, Total Loss: 0.1048, Loss Parts: [0.1048]: 100%|███████████████████| 469/469 [00:06<00:00, 73.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0839
Training Accuracy: 0.9755
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0927
Testing accuracy: 0.9719
Best testing accuracy was: 0.9705
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.0747, Total Loss: 0.1383, Loss Parts: [0.1383]: 100%|███████████████████| 469/469 [00:06<00:00, 74.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0747
Training Accuracy: 0.9786
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.03it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0891
Testing accuracy: 0.9727
Best testing accuracy was: 0.9719
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.0683, Total Loss: 0.1199, Loss Parts: [0.1199]: 100%|███████████████████| 469/469 [00:05<00:00, 86.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0683
Training Accuracy: 0.9801
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0846
Testing accuracy: 0.9740
Best testing accuracy was: 0.9727
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.0620, Total Loss: 0.0507, Loss Parts: [0.0507]: 100%|███████████████████| 469/469 [00:05<00:00, 83.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0620
Training Accuracy: 0.9819
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0858
Testing accuracy: 0.9718
Best testing accuracy was: 0.9740
Stagnation was: 1

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.0569, Total Loss: 0.0303, Loss Parts: [0.0303]: 100%|███████████████████| 469/469 [00:06<00:00, 74.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0569
Training Accuracy: 0.9835
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0897
Testing accuracy: 0.9718
Best testing accuracy was: 0.9740
Stagnation was: 2

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.0514, Total Loss: 0.0265, Loss Parts: [0.0265]: 100%|███████████████████| 469/469 [00:06<00:00, 72.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0514
Training Accuracy: 0.9851
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0774
Testing accuracy: 0.9771
Best testing accuracy was: 0.9740
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.0471, Total Loss: 0.0266, Loss Parts: [0.0266]: 100%|███████████████████| 469/469 [00:05<00:00, 78.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0471
Training Accuracy: 0.9861
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0823
Testing accuracy: 0.9733
Best testing accuracy was: 0.9771
Stagnation was: 1

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.0430, Total Loss: 0.1065, Loss Parts: [0.1065]: 100%|███████████████████| 469/469 [00:06<00:00, 71.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0430
Training Accuracy: 0.9879
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0747
Testing accuracy: 0.9756
Best testing accuracy was: 0.9771
Stagnation was: 2

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.0394, Total Loss: 0.0574, Loss Parts: [0.0574]: 100%|███████████████████| 469/469 [00:06<00:00, 74.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0394
Training Accuracy: 0.9889
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0752
Testing accuracy: 0.9771
Best testing accuracy was: 0.9771
Stagnation was: 3

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.0364, Total Loss: 0.0043, Loss Parts: [0.0043]: 100%|███████████████████| 469/469 [00:06<00:00, 74.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0364
Training Accuracy: 0.9896
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0719
Testing accuracy: 0.9778
Best testing accuracy was: 0.9771
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.0333, Total Loss: 0.0576, Loss Parts: [0.0576]: 100%|███████████████████| 469/469 [00:05<00:00, 79.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0333
Training Accuracy: 0.9909
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0734
Testing accuracy: 0.9773
Best testing accuracy was: 0.9778
Stagnation was: 1

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.0305, Total Loss: 0.0604, Loss Parts: [0.0604]: 100%|███████████████████| 469/469 [00:05<00:00, 81.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0305
Training Accuracy: 0.9913
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0737
Testing accuracy: 0.9777
Best testing accuracy was: 0.9778
Stagnation was: 2

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.0276, Total Loss: 0.0101, Loss Parts: [0.0101]: 100%|███████████████████| 469/469 [00:06<00:00, 77.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0276
Training Accuracy: 0.9925
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0728
Testing accuracy: 0.9793
Best testing accuracy was: 0.9778
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.0268, Total Loss: 0.0212, Loss Parts: [0.0212]: 100%|███████████████████| 469/469 [00:05<00:00, 80.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0268
Training Accuracy: 0.9924
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0732
Testing accuracy: 0.9775
Best testing accuracy was: 0.9793
Stagnation was: 1

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.0236, Total Loss: 0.0206, Loss Parts: [0.0206]: 100%|███████████████████| 469/469 [00:05<00:00, 80.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0236
Training Accuracy: 0.9939
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 25.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0780
Testing accuracy: 0.9760
Best testing accuracy was: 0.9793
Stagnation was: 2

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.0219, Total Loss: 0.0495, Loss Parts: [0.0495]: 100%|███████████████████| 469/469 [00:06<00:00, 74.82it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0219
Training Accuracy: 0.9943
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0717
Testing accuracy: 0.9786
Best testing accuracy was: 0.9793
Stagnation was: 3

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.0196, Total Loss: 0.0158, Loss Parts: [0.0158]: 100%|███████████████████| 469/469 [00:05<00:00, 79.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0196
Training Accuracy: 0.9954
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0769
Testing accuracy: 0.9774
Best testing accuracy was: 0.9793
Stagnation was: 4

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.0184, Total Loss: 0.0106, Loss Parts: [0.0106]: 100%|███████████████████| 469/469 [00:05<00:00, 79.52it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0184
Training Accuracy: 0.9956
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0699
Testing accuracy: 0.9801
Best testing accuracy was: 0.9793
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.0159, Total Loss: 0.0173, Loss Parts: [0.0173]: 100%|███████████████████| 469/469 [00:05<00:00, 81.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0159
Training Accuracy: 0.9966
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0756
Testing accuracy: 0.9775
Best testing accuracy was: 0.9801
Stagnation was: 1

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.0151, Total Loss: 0.0064, Loss Parts: [0.0064]: 100%|███████████████████| 469/469 [00:05<00:00, 85.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0151
Training Accuracy: 0.9966
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0724
Testing accuracy: 0.9791
Best testing accuracy was: 0.9801
Stagnation was: 2

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.0139, Total Loss: 0.0065, Loss Parts: [0.0065]: 100%|███████████████████| 469/469 [00:05<00:00, 81.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0139
Training Accuracy: 0.9970
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0752
Testing accuracy: 0.9776
Best testing accuracy was: 0.9801
Stagnation was: 3

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.0126, Total Loss: 0.0229, Loss Parts: [0.0229]: 100%|███████████████████| 469/469 [00:05<00:00, 79.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0126
Training Accuracy: 0.9978
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0749
Testing accuracy: 0.9783
Best testing accuracy was: 0.9801
Stagnation was: 4

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.0117, Total Loss: 0.0020, Loss Parts: [0.0020]: 100%|███████████████████| 469/469 [00:05<00:00, 84.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0117
Training Accuracy: 0.9979
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0742
Testing accuracy: 0.9791
Best testing accuracy was: 0.9801
Ran out of patience at epoch: 30
Patience was: 5
Training complete in 4m 52s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\6dc3543b6c1a1764\sessions\Session 05-19-2021 05-24-51 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 

Avg. Loss: 0.8306, Total Loss: 0.3305, Loss Parts: [0.3305]: 100%|███████████████████| 469/469 [00:05<00:00, 82.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8306
Training Accuracy: 0.7613
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3645
Testing accuracy: 0.8980
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.3465, Total Loss: 0.3326, Loss Parts: [0.3326]: 100%|███████████████████| 469/469 [00:05<00:00, 79.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3465
Training Accuracy: 0.9055
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3112
Testing accuracy: 0.9154
Best testing accuracy was: 0.8980
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.3093, Total Loss: 0.2884, Loss Parts: [0.2884]: 100%|███████████████████| 469/469 [00:05<00:00, 81.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3093
Training Accuracy: 0.9165
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2904
Testing accuracy: 0.9230
Best testing accuracy was: 0.9154
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.2842, Total Loss: 0.2973, Loss Parts: [0.2973]: 100%|███████████████████| 469/469 [00:05<00:00, 81.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2842
Training Accuracy: 0.9251
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2742
Testing accuracy: 0.9253
Best testing accuracy was: 0.9230
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.2658, Total Loss: 0.3076, Loss Parts: [0.3076]: 100%|███████████████████| 469/469 [00:05<00:00, 79.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2658
Training Accuracy: 0.9298
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2484
Testing accuracy: 0.9340
Best testing accuracy was: 0.9253
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.2551, Total Loss: 0.3050, Loss Parts: [0.3050]: 100%|███████████████████| 469/469 [00:06<00:00, 72.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2551
Training Accuracy: 0.9334
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2396
Testing accuracy: 0.9382
Best testing accuracy was: 0.9340
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.2456, Total Loss: 0.2698, Loss Parts: [0.2698]: 100%|███████████████████| 469/469 [00:06<00:00, 73.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2456
Training Accuracy: 0.9371
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2336
Testing accuracy: 0.9401
Best testing accuracy was: 0.9382
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.2410, Total Loss: 0.3604, Loss Parts: [0.3604]: 100%|██████████████████| 469/469 [00:04<00:00, 102.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2410
Training Accuracy: 0.9383
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2307
Testing accuracy: 0.9396
Best testing accuracy was: 0.9401
Stagnation was: 1

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.2354, Total Loss: 0.2044, Loss Parts: [0.2044]: 100%|███████████████████| 469/469 [00:06<00:00, 77.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2354
Training Accuracy: 0.9398
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2238
Testing accuracy: 0.9430
Best testing accuracy was: 0.9401
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.2330, Total Loss: 0.1731, Loss Parts: [0.1731]: 100%|███████████████████| 469/469 [00:06<00:00, 71.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2330
Training Accuracy: 0.9413
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2231
Testing accuracy: 0.9432
Best testing accuracy was: 0.9430
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.2299, Total Loss: 0.1928, Loss Parts: [0.1928]: 100%|███████████████████| 469/469 [00:06<00:00, 68.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2299
Training Accuracy: 0.9421
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2181
Testing accuracy: 0.9457
Best testing accuracy was: 0.9432
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.2268, Total Loss: 0.2950, Loss Parts: [0.2950]: 100%|███████████████████| 469/469 [00:06<00:00, 74.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2268
Training Accuracy: 0.9432
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2199
Testing accuracy: 0.9427
Best testing accuracy was: 0.9457
Stagnation was: 1

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.2248, Total Loss: 0.2502, Loss Parts: [0.2502]: 100%|███████████████████| 469/469 [00:06<00:00, 77.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2248
Training Accuracy: 0.9433
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2160
Testing accuracy: 0.9458
Best testing accuracy was: 0.9457
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.2230, Total Loss: 0.2321, Loss Parts: [0.2321]: 100%|███████████████████| 469/469 [00:06<00:00, 73.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2230
Training Accuracy: 0.9441
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2132
Testing accuracy: 0.9473
Best testing accuracy was: 0.9458
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.2209, Total Loss: 0.3906, Loss Parts: [0.3906]: 100%|███████████████████| 469/469 [00:06<00:00, 72.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2209
Training Accuracy: 0.9448
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2112
Testing accuracy: 0.9445
Best testing accuracy was: 0.9473
Stagnation was: 1

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.2199, Total Loss: 0.2677, Loss Parts: [0.2677]: 100%|███████████████████| 469/469 [00:06<00:00, 71.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2199
Training Accuracy: 0.9453
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2092
Testing accuracy: 0.9478
Best testing accuracy was: 0.9473
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.2175, Total Loss: 0.2497, Loss Parts: [0.2497]: 100%|███████████████████| 469/469 [00:06<00:00, 76.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2175
Training Accuracy: 0.9457
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2111
Testing accuracy: 0.9459
Best testing accuracy was: 0.9478
Stagnation was: 1

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.2167, Total Loss: 0.2431, Loss Parts: [0.2431]: 100%|███████████████████| 469/469 [00:06<00:00, 71.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2167
Training Accuracy: 0.9462
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2073
Testing accuracy: 0.9461
Best testing accuracy was: 0.9478
Stagnation was: 2

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.2156, Total Loss: 0.1958, Loss Parts: [0.1958]: 100%|███████████████████| 469/469 [00:06<00:00, 73.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2156
Training Accuracy: 0.9466
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2083
Testing accuracy: 0.9489
Best testing accuracy was: 0.9478
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.2150, Total Loss: 0.1614, Loss Parts: [0.1614]: 100%|███████████████████| 469/469 [00:06<00:00, 72.31it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2150
Training Accuracy: 0.9469
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2104
Testing accuracy: 0.9480
Best testing accuracy was: 0.9489
Stagnation was: 1

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.2144, Total Loss: 0.1469, Loss Parts: [0.1469]: 100%|███████████████████| 469/469 [00:06<00:00, 73.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2144
Training Accuracy: 0.9471
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2065
Testing accuracy: 0.9492
Best testing accuracy was: 0.9489
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.2132, Total Loss: 0.2487, Loss Parts: [0.2487]: 100%|███████████████████| 469/469 [00:06<00:00, 71.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2132
Training Accuracy: 0.9473
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2066
Testing accuracy: 0.9470
Best testing accuracy was: 0.9492
Stagnation was: 1

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.2127, Total Loss: 0.1975, Loss Parts: [0.1975]: 100%|███████████████████| 469/469 [00:06<00:00, 73.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2127
Training Accuracy: 0.9473
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2032
Testing accuracy: 0.9508
Best testing accuracy was: 0.9492
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.2125, Total Loss: 0.1502, Loss Parts: [0.1502]: 100%|███████████████████| 469/469 [00:06<00:00, 72.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2125
Training Accuracy: 0.9480
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2017
Testing accuracy: 0.9503
Best testing accuracy was: 0.9508
Stagnation was: 1

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.2111, Total Loss: 0.1247, Loss Parts: [0.1247]: 100%|███████████████████| 469/469 [00:06<00:00, 76.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2111
Training Accuracy: 0.9478
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.81it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2044
Testing accuracy: 0.9480
Best testing accuracy was: 0.9508
Stagnation was: 2

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.2116, Total Loss: 0.2100, Loss Parts: [0.2100]: 100%|███████████████████| 469/469 [00:06<00:00, 71.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2116
Training Accuracy: 0.9486
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2034
Testing accuracy: 0.9482
Best testing accuracy was: 0.9508
Stagnation was: 3

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.2113, Total Loss: 0.1436, Loss Parts: [0.1436]: 100%|███████████████████| 469/469 [00:06<00:00, 70.76it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2113
Training Accuracy: 0.9482
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1991
Testing accuracy: 0.9516
Best testing accuracy was: 0.9508
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.2103, Total Loss: 0.1813, Loss Parts: [0.1813]: 100%|███████████████████| 469/469 [00:06<00:00, 73.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2103
Training Accuracy: 0.9483
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2011
Testing accuracy: 0.9493
Best testing accuracy was: 0.9516
Stagnation was: 1

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.2098, Total Loss: 0.2234, Loss Parts: [0.2234]: 100%|███████████████████| 469/469 [00:06<00:00, 77.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2098
Training Accuracy: 0.9492
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2041
Testing accuracy: 0.9511
Best testing accuracy was: 0.9516
Stagnation was: 2

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.2090, Total Loss: 0.2086, Loss Parts: [0.2086]: 100%|███████████████████| 469/469 [00:06<00:00, 77.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2090
Training Accuracy: 0.9489
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2012
Testing accuracy: 0.9509
Best testing accuracy was: 0.9516
Stagnation was: 3

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.2085, Total Loss: 0.1586, Loss Parts: [0.1586]: 100%|███████████████████| 469/469 [00:05<00:00, 79.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2085
Training Accuracy: 0.9489
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2004
Testing accuracy: 0.9513
Best testing accuracy was: 0.9516
Stagnation was: 4

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.2092, Total Loss: 0.2438, Loss Parts: [0.2438]: 100%|███████████████████| 469/469 [00:06<00:00, 74.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2092
Training Accuracy: 0.9492
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2014
Testing accuracy: 0.9508
Best testing accuracy was: 0.9516
Ran out of patience at epoch: 31
Patience was: 5
Training complete in 5m 13s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\bc8947ac3ab84b26\sessions\Session 05-19-2021 05-30-04 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5

Avg. Loss: 1.8426, Total Loss: 1.2920, Loss Parts: [1.2920]: 100%|███████████████████| 469/469 [00:06<00:00, 75.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.8426
Training Accuracy: 0.4381
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 1.3293
Testing accuracy: 0.6347
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 1.1029, Total Loss: 1.0554, Loss Parts: [1.0554]: 100%|███████████████████| 469/469 [00:06<00:00, 74.68it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.1029
Training Accuracy: 0.7018
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9997
Testing accuracy: 0.7613
Best testing accuracy was: 0.6347
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 1.0106, Total Loss: 1.0909, Loss Parts: [1.0909]: 100%|███████████████████| 469/469 [00:06<00:00, 70.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0106
Training Accuracy: 0.7338
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9812
Testing accuracy: 0.7557
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 1.0033, Total Loss: 1.2634, Loss Parts: [1.2634]: 100%|███████████████████| 469/469 [00:06<00:00, 68.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0033
Training Accuracy: 0.7383
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9940
Testing accuracy: 0.7402
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 1.0063, Total Loss: 0.9985, Loss Parts: [0.9985]: 100%|███████████████████| 469/469 [00:06<00:00, 77.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0063
Training Accuracy: 0.7348
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9855
Testing accuracy: 0.7400
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 1.0020, Total Loss: 0.8995, Loss Parts: [0.8995]: 100%|███████████████████| 469/469 [00:06<00:00, 72.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0020
Training Accuracy: 0.7375
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9724
Testing accuracy: 0.7476
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 1.0010, Total Loss: 1.0008, Loss Parts: [1.0008]: 100%|███████████████████| 469/469 [00:06<00:00, 72.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0010
Training Accuracy: 0.7387
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9826
Testing accuracy: 0.7336
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.9997, Total Loss: 1.0061, Loss Parts: [1.0061]: 100%|███████████████████| 469/469 [00:06<00:00, 72.22it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9997
Training Accuracy: 0.7391
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9765
Testing accuracy: 0.7536
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.9981, Total Loss: 0.9721, Loss Parts: [0.9721]: 100%|███████████████████| 469/469 [00:05<00:00, 79.95it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9981
Training Accuracy: 0.7403
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9735
Testing accuracy: 0.7594
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.9982, Total Loss: 0.9071, Loss Parts: [0.9071]: 100%|███████████████████| 469/469 [00:06<00:00, 75.78it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9982
Training Accuracy: 0.7407
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.82it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9835
Testing accuracy: 0.7340
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.9982, Total Loss: 0.9880, Loss Parts: [0.9880]: 100%|███████████████████| 469/469 [00:06<00:00, 73.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9982
Training Accuracy: 0.7400
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9835
Testing accuracy: 0.7447
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.9991, Total Loss: 0.9578, Loss Parts: [0.9578]: 100%|███████████████████| 469/469 [00:06<00:00, 75.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9991
Training Accuracy: 0.7398
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.31it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9793
Testing accuracy: 0.7681
Best testing accuracy was: 0.7613
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.9986, Total Loss: 1.0168, Loss Parts: [1.0168]: 100%|███████████████████| 469/469 [00:06<00:00, 72.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9986
Training Accuracy: 0.7394
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9789
Testing accuracy: 0.7616
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.9981, Total Loss: 0.9875, Loss Parts: [0.9875]: 100%|███████████████████| 469/469 [00:06<00:00, 75.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9981
Training Accuracy: 0.7387
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9826
Testing accuracy: 0.7527
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.9983, Total Loss: 1.0131, Loss Parts: [1.0131]: 100%|███████████████████| 469/469 [00:06<00:00, 71.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9983
Training Accuracy: 0.7399
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9844
Testing accuracy: 0.7598
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.9982, Total Loss: 1.0030, Loss Parts: [1.0030]: 100%|███████████████████| 469/469 [00:05<00:00, 78.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9982
Training Accuracy: 0.7402
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9857
Testing accuracy: 0.7512
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 1.0004, Total Loss: 0.9786, Loss Parts: [0.9786]: 100%|███████████████████| 469/469 [00:05<00:00, 82.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.0004
Training Accuracy: 0.7385
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9763
Testing accuracy: 0.7626
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.9978, Total Loss: 1.0040, Loss Parts: [1.0040]: 100%|███████████████████| 469/469 [00:06<00:00, 78.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9978
Training Accuracy: 0.7407
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9786
Testing accuracy: 0.7631
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.9980, Total Loss: 0.9539, Loss Parts: [0.9539]: 100%|███████████████████| 469/469 [00:06<00:00, 67.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9980
Training Accuracy: 0.7390
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9720
Testing accuracy: 0.7633
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.9991, Total Loss: 0.9792, Loss Parts: [0.9792]: 100%|███████████████████| 469/469 [00:06<00:00, 74.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9991
Training Accuracy: 0.7400
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9850
Testing accuracy: 0.7344
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.9970, Total Loss: 0.9552, Loss Parts: [0.9552]: 100%|███████████████████| 469/469 [00:06<00:00, 72.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9970
Training Accuracy: 0.7403
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9783
Testing accuracy: 0.7517
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.9977, Total Loss: 1.0931, Loss Parts: [1.0931]: 100%|███████████████████| 469/469 [00:05<00:00, 78.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9977
Training Accuracy: 0.7390
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9806
Testing accuracy: 0.7581
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.9983, Total Loss: 1.0004, Loss Parts: [1.0004]: 100%|███████████████████| 469/469 [00:06<00:00, 71.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9983
Training Accuracy: 0.7400
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9783
Testing accuracy: 0.7448
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.9978, Total Loss: 1.0891, Loss Parts: [1.0891]: 100%|███████████████████| 469/469 [00:06<00:00, 69.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9978
Training Accuracy: 0.7404
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9755
Testing accuracy: 0.7370
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.9993, Total Loss: 0.9503, Loss Parts: [0.9503]: 100%|███████████████████| 469/469 [00:06<00:00, 77.76it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9993
Training Accuracy: 0.7389
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9723
Testing accuracy: 0.7601
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.9978, Total Loss: 0.9512, Loss Parts: [0.9512]: 100%|███████████████████| 469/469 [00:06<00:00, 72.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9978
Training Accuracy: 0.7399
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9849
Testing accuracy: 0.7467
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.9988, Total Loss: 0.9562, Loss Parts: [0.9562]: 100%|███████████████████| 469/469 [00:06<00:00, 72.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9988
Training Accuracy: 0.7391
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9749
Testing accuracy: 0.7570
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.9983, Total Loss: 0.9488, Loss Parts: [0.9488]: 100%|███████████████████| 469/469 [00:06<00:00, 69.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9983
Training Accuracy: 0.7396
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9767
Testing accuracy: 0.7636
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.9972, Total Loss: 1.0457, Loss Parts: [1.0457]: 100%|███████████████████| 469/469 [00:06<00:00, 72.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9972
Training Accuracy: 0.7407
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9767
Testing accuracy: 0.7631
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.9993, Total Loss: 0.9673, Loss Parts: [0.9673]: 100%|███████████████████| 469/469 [00:06<00:00, 69.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9993
Training Accuracy: 0.7377
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9722
Testing accuracy: 0.7678
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.9970, Total Loss: 1.0921, Loss Parts: [1.0921]: 100%|███████████████████| 469/469 [00:06<00:00, 69.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9970
Training Accuracy: 0.7405
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9758
Testing accuracy: 0.7656
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.9988, Total Loss: 1.0112, Loss Parts: [1.0112]: 100%|███████████████████| 469/469 [00:06<00:00, 72.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9988
Training Accuracy: 0.7386
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9808
Testing accuracy: 0.7348
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 0.9980, Total Loss: 1.0837, Loss Parts: [1.0837]: 100%|███████████████████| 469/469 [00:06<00:00, 69.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9980
Training Accuracy: 0.7392
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9790
Testing accuracy: 0.7593
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 0.9972, Total Loss: 0.9335, Loss Parts: [0.9335]: 100%|███████████████████| 469/469 [00:05<00:00, 78.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9972
Training Accuracy: 0.7419
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9781
Testing accuracy: 0.7425
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 0.9975, Total Loss: 1.0564, Loss Parts: [1.0564]: 100%|███████████████████| 469/469 [00:06<00:00, 75.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9975
Training Accuracy: 0.7409
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9718
Testing accuracy: 0.7649
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 0.9961, Total Loss: 1.0159, Loss Parts: [1.0159]: 100%|███████████████████| 469/469 [00:06<00:00, 73.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9961
Training Accuracy: 0.7424
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9768
Testing accuracy: 0.7501
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 0.9983, Total Loss: 0.9521, Loss Parts: [0.9521]: 100%|███████████████████| 469/469 [00:06<00:00, 70.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9983
Training Accuracy: 0.7401
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9718
Testing accuracy: 0.7597
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 0.9990, Total Loss: 1.0320, Loss Parts: [1.0320]: 100%|███████████████████| 469/469 [00:06<00:00, 71.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9990
Training Accuracy: 0.7392
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9673
Testing accuracy: 0.7461
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 0.9972, Total Loss: 0.9203, Loss Parts: [0.9203]: 100%|███████████████████| 469/469 [00:06<00:00, 74.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9972
Training Accuracy: 0.7420
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9781
Testing accuracy: 0.7385
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 0.9987, Total Loss: 1.0093, Loss Parts: [1.0093]: 100%|███████████████████| 469/469 [00:06<00:00, 75.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9987
Training Accuracy: 0.7390
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9813
Testing accuracy: 0.7462
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 0.9970, Total Loss: 1.0282, Loss Parts: [1.0282]: 100%|███████████████████| 469/469 [00:06<00:00, 73.62it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9970
Training Accuracy: 0.7418
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9766
Testing accuracy: 0.7534
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 0.9972, Total Loss: 1.0156, Loss Parts: [1.0156]: 100%|███████████████████| 469/469 [00:06<00:00, 74.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9972
Training Accuracy: 0.7412
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9826
Testing accuracy: 0.7626
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 0.9987, Total Loss: 1.0777, Loss Parts: [1.0777]: 100%|███████████████████| 469/469 [00:06<00:00, 69.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9987
Training Accuracy: 0.7393
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9774
Testing accuracy: 0.7682
Best testing accuracy was: 0.7681
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 0.9977, Total Loss: 0.9155, Loss Parts: [0.9155]: 100%|███████████████████| 469/469 [00:06<00:00, 71.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9977
Training Accuracy: 0.7414
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9699
Testing accuracy: 0.7520
Best testing accuracy was: 0.7682
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 0.9981, Total Loss: 0.9453, Loss Parts: [0.9453]: 100%|███████████████████| 469/469 [00:06<00:00, 70.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9981
Training Accuracy: 0.7393
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9787
Testing accuracy: 0.7386
Best testing accuracy was: 0.7682
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 0.9987, Total Loss: 0.9110, Loss Parts: [0.9110]: 100%|███████████████████| 469/469 [00:05<00:00, 82.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9987
Training Accuracy: 0.7381
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9762
Testing accuracy: 0.7500
Best testing accuracy was: 0.7682
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 0.9980, Total Loss: 0.9815, Loss Parts: [0.9815]: 100%|███████████████████| 469/469 [00:06<00:00, 71.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9980
Training Accuracy: 0.7394
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9731
Testing accuracy: 0.7594
Best testing accuracy was: 0.7682
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 0.9982, Total Loss: 0.8933, Loss Parts: [0.8933]: 100%|███████████████████| 469/469 [00:06<00:00, 72.65it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9982
Training Accuracy: 0.7396
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.22it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9757
Testing accuracy: 0.7351
Best testing accuracy was: 0.7682
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 0.9981, Total Loss: 1.0791, Loss Parts: [1.0791]: 100%|███████████████████| 469/469 [00:05<00:00, 80.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9981
Training Accuracy: 0.7388
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9876
Testing accuracy: 0.7407
Best testing accuracy was: 0.7682
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 0.9974, Total Loss: 1.0799, Loss Parts: [1.0799]: 100%|███████████████████| 469/469 [00:06<00:00, 77.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.9974
Training Accuracy: 0.7411
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9925
Testing accuracy: 0.7309
Best testing accuracy was: 0.7682
Stagnation was: 0

Training complete in 8m 16s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\f16119680fd73e13\sessions\Session 05-19-2021 05-38-20 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_index': 0}

Avg. Loss: 1.5021, Total Loss: 0.4645, Loss Parts: [0.4645]: 100%|███████████████████| 469/469 [00:06<00:00, 69.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.5021
Training Accuracy: 0.4680
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.4334
Testing accuracy: 0.8708
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.3231, Total Loss: 0.2355, Loss Parts: [0.2355]: 100%|███████████████████| 469/469 [00:06<00:00, 69.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3231
Training Accuracy: 0.9040
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2322
Testing accuracy: 0.9309
Best testing accuracy was: 0.8708
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.1899, Total Loss: 0.2988, Loss Parts: [0.2988]: 100%|███████████████████| 469/469 [00:06<00:00, 72.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1899
Training Accuracy: 0.9433
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1759
Testing accuracy: 0.9446
Best testing accuracy was: 0.9309
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.1363, Total Loss: 0.1822, Loss Parts: [0.1822]: 100%|███████████████████| 469/469 [00:07<00:00, 66.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1363
Training Accuracy: 0.9596
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1339
Testing accuracy: 0.9555
Best testing accuracy was: 0.9446
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.1085, Total Loss: 0.0585, Loss Parts: [0.0585]: 100%|███████████████████| 469/469 [00:07<00:00, 66.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1085
Training Accuracy: 0.9673
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1200
Testing accuracy: 0.9615
Best testing accuracy was: 0.9555
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.0905, Total Loss: 0.0356, Loss Parts: [0.0356]: 100%|███████████████████| 469/469 [00:06<00:00, 67.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0905
Training Accuracy: 0.9729
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1018
Testing accuracy: 0.9688
Best testing accuracy was: 0.9615
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.0786, Total Loss: 0.1195, Loss Parts: [0.1195]: 100%|███████████████████| 469/469 [00:06<00:00, 70.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0786
Training Accuracy: 0.9762
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.82it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1057
Testing accuracy: 0.9684
Best testing accuracy was: 0.9688
Stagnation was: 1

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.0671, Total Loss: 0.0451, Loss Parts: [0.0451]: 100%|███████████████████| 469/469 [00:06<00:00, 75.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0671
Training Accuracy: 0.9800
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1013
Testing accuracy: 0.9702
Best testing accuracy was: 0.9688
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.0595, Total Loss: 0.0399, Loss Parts: [0.0399]: 100%|███████████████████| 469/469 [00:06<00:00, 69.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0595
Training Accuracy: 0.9815
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0952
Testing accuracy: 0.9716
Best testing accuracy was: 0.9702
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.0514, Total Loss: 0.0591, Loss Parts: [0.0591]: 100%|███████████████████| 469/469 [00:06<00:00, 72.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0514
Training Accuracy: 0.9843
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1004
Testing accuracy: 0.9707
Best testing accuracy was: 0.9716
Stagnation was: 1

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.0452, Total Loss: 0.0393, Loss Parts: [0.0393]: 100%|███████████████████| 469/469 [00:06<00:00, 73.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0452
Training Accuracy: 0.9864
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0918
Testing accuracy: 0.9739
Best testing accuracy was: 0.9716
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.0375, Total Loss: 0.0106, Loss Parts: [0.0106]: 100%|███████████████████| 469/469 [00:06<00:00, 74.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0375
Training Accuracy: 0.9883
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0934
Testing accuracy: 0.9742
Best testing accuracy was: 0.9739
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.0348, Total Loss: 0.0249, Loss Parts: [0.0249]: 100%|███████████████████| 469/469 [00:06<00:00, 75.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0348
Training Accuracy: 0.9891
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0931
Testing accuracy: 0.9734
Best testing accuracy was: 0.9742
Stagnation was: 1

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.0315, Total Loss: 0.0137, Loss Parts: [0.0137]: 100%|███████████████████| 469/469 [00:06<00:00, 78.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0315
Training Accuracy: 0.9903
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0877
Testing accuracy: 0.9770
Best testing accuracy was: 0.9742
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.0297, Total Loss: 0.0193, Loss Parts: [0.0193]: 100%|███████████████████| 469/469 [00:05<00:00, 79.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0297
Training Accuracy: 0.9906
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0962
Testing accuracy: 0.9749
Best testing accuracy was: 0.9770
Stagnation was: 1

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.0237, Total Loss: 0.0026, Loss Parts: [0.0026]: 100%|███████████████████| 469/469 [00:06<00:00, 75.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0237
Training Accuracy: 0.9928
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1053
Testing accuracy: 0.9745
Best testing accuracy was: 0.9770
Stagnation was: 2

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.0212, Total Loss: 0.0077, Loss Parts: [0.0077]: 100%|███████████████████| 469/469 [00:06<00:00, 72.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0212
Training Accuracy: 0.9935
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.20it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0944
Testing accuracy: 0.9767
Best testing accuracy was: 0.9770
Stagnation was: 3

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.0181, Total Loss: 0.0298, Loss Parts: [0.0298]: 100%|███████████████████| 469/469 [00:06<00:00, 77.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0181
Training Accuracy: 0.9947
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.0959
Testing accuracy: 0.9768
Best testing accuracy was: 0.9770
Stagnation was: 4

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.0161, Total Loss: 0.0144, Loss Parts: [0.0144]: 100%|███████████████████| 469/469 [00:05<00:00, 82.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0161
Training Accuracy: 0.9954
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1068
Testing accuracy: 0.9737
Best testing accuracy was: 0.9770
Ran out of patience at epoch: 18
Patience was: 5
Training complete in 3m 9s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\23e792c32f5d72c2\sessions\Session 05-19-2021 05-41-30 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_pa

Avg. Loss: 1.9197, Total Loss: 0.9211, Loss Parts: [0.9211]: 100%|███████████████████| 469/469 [00:05<00:00, 80.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.9197
Training Accuracy: 0.2979
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 1.0558
Testing accuracy: 0.6337
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 0.6450, Total Loss: 0.1944, Loss Parts: [0.1944]: 100%|███████████████████| 469/469 [00:06<00:00, 73.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.6450
Training Accuracy: 0.8050
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.20it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3873
Testing accuracy: 0.8888
Best testing accuracy was: 0.6337
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.3317, Total Loss: 0.2844, Loss Parts: [0.2844]: 100%|███████████████████| 469/469 [00:06<00:00, 71.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3317
Training Accuracy: 0.9096
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2781
Testing accuracy: 0.9242
Best testing accuracy was: 0.8888
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.2674, Total Loss: 0.1886, Loss Parts: [0.1886]: 100%|███████████████████| 469/469 [00:06<00:00, 67.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2674
Training Accuracy: 0.9284
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2670
Testing accuracy: 0.9256
Best testing accuracy was: 0.9242
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.2386, Total Loss: 0.3082, Loss Parts: [0.3082]: 100%|███████████████████| 469/469 [00:06<00:00, 71.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2386
Training Accuracy: 0.9372
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.81it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2986
Testing accuracy: 0.9139
Best testing accuracy was: 0.9256
Stagnation was: 1

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.2286, Total Loss: 0.2651, Loss Parts: [0.2651]: 100%|███████████████████| 469/469 [00:06<00:00, 69.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2286
Training Accuracy: 0.9399
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2272
Testing accuracy: 0.9428
Best testing accuracy was: 0.9256
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.2222, Total Loss: 0.2353, Loss Parts: [0.2353]: 100%|███████████████████| 469/469 [00:06<00:00, 70.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2222
Training Accuracy: 0.9424
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2166
Testing accuracy: 0.9422
Best testing accuracy was: 0.9428
Stagnation was: 1

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.2138, Total Loss: 0.1877, Loss Parts: [0.1877]: 100%|███████████████████| 469/469 [00:06<00:00, 72.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2138
Training Accuracy: 0.9439
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2114
Testing accuracy: 0.9433
Best testing accuracy was: 0.9428
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.2086, Total Loss: 0.2016, Loss Parts: [0.2016]: 100%|███████████████████| 469/469 [00:06<00:00, 72.20it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2086
Training Accuracy: 0.9452
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2197
Testing accuracy: 0.9389
Best testing accuracy was: 0.9433
Stagnation was: 1

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.2060, Total Loss: 0.1913, Loss Parts: [0.1913]: 100%|███████████████████| 469/469 [00:06<00:00, 73.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2060
Training Accuracy: 0.9468
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2034
Testing accuracy: 0.9445
Best testing accuracy was: 0.9433
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.2008, Total Loss: 0.2653, Loss Parts: [0.2653]: 100%|███████████████████| 469/469 [00:06<00:00, 73.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2008
Training Accuracy: 0.9484
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2112
Testing accuracy: 0.9416
Best testing accuracy was: 0.9445
Stagnation was: 1

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.2024, Total Loss: 0.3145, Loss Parts: [0.3145]: 100%|███████████████████| 469/469 [00:06<00:00, 70.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2024
Training Accuracy: 0.9483
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2212
Testing accuracy: 0.9397
Best testing accuracy was: 0.9445
Stagnation was: 2

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.1992, Total Loss: 0.2379, Loss Parts: [0.2379]: 100%|███████████████████| 469/469 [00:06<00:00, 70.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1992
Training Accuracy: 0.9488
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2055
Testing accuracy: 0.9423
Best testing accuracy was: 0.9445
Stagnation was: 3

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.1977, Total Loss: 0.2191, Loss Parts: [0.2191]: 100%|███████████████████| 469/469 [00:06<00:00, 69.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1977
Training Accuracy: 0.9494
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1922
Testing accuracy: 0.9517
Best testing accuracy was: 0.9445
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.1964, Total Loss: 0.2609, Loss Parts: [0.2609]: 100%|███████████████████| 469/469 [00:06<00:00, 69.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1964
Training Accuracy: 0.9494
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1951
Testing accuracy: 0.9479
Best testing accuracy was: 0.9517
Stagnation was: 1

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.1968, Total Loss: 0.2156, Loss Parts: [0.2156]: 100%|███████████████████| 469/469 [00:06<00:00, 69.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1968
Training Accuracy: 0.9506
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2022
Testing accuracy: 0.9459
Best testing accuracy was: 0.9517
Stagnation was: 2

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.1934, Total Loss: 0.2368, Loss Parts: [0.2368]: 100%|███████████████████| 469/469 [00:06<00:00, 73.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1934
Training Accuracy: 0.9503
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.22it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1933
Testing accuracy: 0.9496
Best testing accuracy was: 0.9517
Stagnation was: 3

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.1928, Total Loss: 0.2420, Loss Parts: [0.2420]: 100%|███████████████████| 469/469 [00:06<00:00, 76.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1928
Training Accuracy: 0.9502
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1909
Testing accuracy: 0.9518
Best testing accuracy was: 0.9517
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.1907, Total Loss: 0.2271, Loss Parts: [0.2271]: 100%|███████████████████| 469/469 [00:06<00:00, 77.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1907
Training Accuracy: 0.9516
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1914
Testing accuracy: 0.9513
Best testing accuracy was: 0.9518
Stagnation was: 1

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.1930, Total Loss: 0.3041, Loss Parts: [0.3041]: 100%|███████████████████| 469/469 [00:05<00:00, 81.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1930
Training Accuracy: 0.9500
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1980
Testing accuracy: 0.9476
Best testing accuracy was: 0.9518
Stagnation was: 2

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.1892, Total Loss: 0.1699, Loss Parts: [0.1699]: 100%|███████████████████| 469/469 [00:05<00:00, 79.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1892
Training Accuracy: 0.9512
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2097
Testing accuracy: 0.9432
Best testing accuracy was: 0.9518
Stagnation was: 3

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.1893, Total Loss: 0.1984, Loss Parts: [0.1984]: 100%|███████████████████| 469/469 [00:06<00:00, 68.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1893
Training Accuracy: 0.9527
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1821
Testing accuracy: 0.9542
Best testing accuracy was: 0.9518
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.1874, Total Loss: 0.1839, Loss Parts: [0.1839]: 100%|███████████████████| 469/469 [00:07<00:00, 65.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1874
Training Accuracy: 0.9525
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1895
Testing accuracy: 0.9519
Best testing accuracy was: 0.9542
Stagnation was: 1

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.1870, Total Loss: 0.1966, Loss Parts: [0.1966]: 100%|███████████████████| 469/469 [00:06<00:00, 74.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1870
Training Accuracy: 0.9524
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1916
Testing accuracy: 0.9519
Best testing accuracy was: 0.9542
Stagnation was: 2

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.1887, Total Loss: 0.1209, Loss Parts: [0.1209]: 100%|███████████████████| 469/469 [00:06<00:00, 71.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1887
Training Accuracy: 0.9520
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1959
Testing accuracy: 0.9493
Best testing accuracy was: 0.9542
Stagnation was: 3

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.1873, Total Loss: 0.1740, Loss Parts: [0.1740]: 100%|███████████████████| 469/469 [00:07<00:00, 65.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1873
Training Accuracy: 0.9525
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1900
Testing accuracy: 0.9498
Best testing accuracy was: 0.9542
Stagnation was: 4

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.1862, Total Loss: 0.1163, Loss Parts: [0.1163]: 100%|███████████████████| 469/469 [00:07<00:00, 66.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1862
Training Accuracy: 0.9530
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1953
Testing accuracy: 0.9480
Best testing accuracy was: 0.9542
Ran out of patience at epoch: 26
Patience was: 5
Training complete in 4m 31s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\2546c661d445a238\sessions\Session 05-19-2021 05-46-00 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_pa

Avg. Loss: 2.3020, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:06<00:00, 72.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3020
Training Accuracy: 0.1103
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.59it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3063, Loss Parts: [2.3063]: 100%|███████████████████| 469/469 [00:06<00:00, 69.95it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:06<00:00, 69.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:06<00:00, 69.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3028, Loss Parts: [2.3028]: 100%|███████████████████| 469/469 [00:06<00:00, 70.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2975, Loss Parts: [2.2975]: 100%|███████████████████| 469/469 [00:07<00:00, 66.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2976, Loss Parts: [2.2976]: 100%|███████████████████| 469/469 [00:07<00:00, 65.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2992, Loss Parts: [2.2992]: 100%|███████████████████| 469/469 [00:07<00:00, 66.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3056, Loss Parts: [2.3056]: 100%|███████████████████| 469/469 [00:07<00:00, 65.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1116
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2963, Loss Parts: [2.2963]: 100%|███████████████████| 469/469 [00:06<00:00, 75.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:06<00:00, 68.57it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.30it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3088, Loss Parts: [2.3088]: 100%|███████████████████| 469/469 [00:06<00:00, 68.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3071, Loss Parts: [2.3071]: 100%|███████████████████| 469/469 [00:06<00:00, 68.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3018
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2959, Loss Parts: [2.2959]: 100%|███████████████████| 469/469 [00:06<00:00, 69.76it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:06<00:00, 73.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1115
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3051, Loss Parts: [2.3051]: 100%|███████████████████| 469/469 [00:06<00:00, 70.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3020, Loss Parts: [2.3020]: 100%|███████████████████| 469/469 [00:06<00:00, 69.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.01it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2992, Loss Parts: [2.2992]: 100%|███████████████████| 469/469 [00:07<00:00, 63.95it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3018
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:07<00:00, 66.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3030, Loss Parts: [2.3030]: 100%|███████████████████| 469/469 [00:06<00:00, 68.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:07<00:00, 63.52it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3024, Loss Parts: [2.3024]: 100%|███████████████████| 469/469 [00:06<00:00, 68.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3037, Loss Parts: [2.3037]: 100%|███████████████████| 469/469 [00:07<00:00, 66.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2949, Loss Parts: [2.2949]: 100%|███████████████████| 469/469 [00:06<00:00, 69.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2971, Loss Parts: [2.2971]: 100%|███████████████████| 469/469 [00:07<00:00, 66.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3054, Loss Parts: [2.3054]: 100%|███████████████████| 469/469 [00:07<00:00, 65.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2966, Loss Parts: [2.2966]: 100%|███████████████████| 469/469 [00:07<00:00, 63.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3012, Loss Parts: [2.3012]: 100%|███████████████████| 469/469 [00:06<00:00, 68.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3067, Loss Parts: [2.3067]: 100%|███████████████████| 469/469 [00:07<00:00, 66.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3064, Loss Parts: [2.3064]: 100%|███████████████████| 469/469 [00:07<00:00, 66.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3057, Loss Parts: [2.3057]: 100%|███████████████████| 469/469 [00:07<00:00, 64.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3028, Loss Parts: [2.3028]: 100%|███████████████████| 469/469 [00:07<00:00, 64.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2997, Loss Parts: [2.2997]: 100%|███████████████████| 469/469 [00:06<00:00, 73.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:06<00:00, 73.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2991, Loss Parts: [2.2991]: 100%|███████████████████| 469/469 [00:07<00:00, 66.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3042, Loss Parts: [2.3042]: 100%|███████████████████| 469/469 [00:06<00:00, 67.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2992, Loss Parts: [2.2992]: 100%|███████████████████| 469/469 [00:07<00:00, 65.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3018
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2994, Loss Parts: [2.2994]: 100%|███████████████████| 469/469 [00:07<00:00, 66.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3040, Loss Parts: [2.3040]: 100%|███████████████████| 469/469 [00:07<00:00, 66.20it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3017, Loss Parts: [2.3017]: 100%|███████████████████| 469/469 [00:07<00:00, 65.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1110
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.31it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3048, Loss Parts: [2.3048]: 100%|███████████████████| 469/469 [00:07<00:00, 67.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1122
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3051, Loss Parts: [2.3051]: 100%|███████████████████| 469/469 [00:07<00:00, 66.31it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2983, Loss Parts: [2.2983]: 100%|███████████████████| 469/469 [00:07<00:00, 65.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2994, Loss Parts: [2.2994]: 100%|███████████████████| 469/469 [00:06<00:00, 67.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:06<00:00, 70.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2994, Loss Parts: [2.2994]: 100%|███████████████████| 469/469 [00:07<00:00, 65.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2976, Loss Parts: [2.2976]: 100%|███████████████████| 469/469 [00:07<00:00, 66.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3036, Loss Parts: [2.3036]: 100%|███████████████████| 469/469 [00:07<00:00, 64.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2991, Loss Parts: [2.2991]: 100%|███████████████████| 469/469 [00:06<00:00, 67.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3017, Loss Parts: [2.3017]: 100%|███████████████████| 469/469 [00:06<00:00, 68.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.22it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 8m 43s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\34598a7849cdff8c\sessions\Session 05-19-2021 05-54-44 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_

Avg. Loss: 2.2997, Total Loss: 2.3021, Loss Parts: [2.3021]: 100%|███████████████████| 469/469 [00:06<00:00, 67.62it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.2997
Training Accuracy: 0.1112
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.2932
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 1.5690, Total Loss: 0.7543, Loss Parts: [0.7543]: 100%|███████████████████| 469/469 [00:07<00:00, 64.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.5690
Training Accuracy: 0.4212
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.6087
Testing accuracy: 0.8205
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 0.3519, Total Loss: 0.1791, Loss Parts: [0.1791]: 100%|███████████████████| 469/469 [00:07<00:00, 62.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3519
Training Accuracy: 0.8995
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2209
Testing accuracy: 0.9379
Best testing accuracy was: 0.8205
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 0.1841, Total Loss: 0.1858, Loss Parts: [0.1858]: 100%|███████████████████| 469/469 [00:07<00:00, 64.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1841
Training Accuracy: 0.9477
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1837
Testing accuracy: 0.9480
Best testing accuracy was: 0.9379
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 0.1302, Total Loss: 0.1203, Loss Parts: [0.1203]: 100%|███████████████████| 469/469 [00:07<00:00, 63.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1302
Training Accuracy: 0.9631
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.81it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1795
Testing accuracy: 0.9510
Best testing accuracy was: 0.9480
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 0.1018, Total Loss: 0.0758, Loss Parts: [0.0758]: 100%|███████████████████| 469/469 [00:06<00:00, 72.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1018
Training Accuracy: 0.9696
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1251
Testing accuracy: 0.9657
Best testing accuracy was: 0.9510
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 0.0838, Total Loss: 0.1655, Loss Parts: [0.1655]: 100%|███████████████████| 469/469 [00:07<00:00, 65.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0838
Training Accuracy: 0.9757
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1197
Testing accuracy: 0.9683
Best testing accuracy was: 0.9657
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 0.0710, Total Loss: 0.0752, Loss Parts: [0.0752]: 100%|███████████████████| 469/469 [00:07<00:00, 64.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0710
Training Accuracy: 0.9791
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1142
Testing accuracy: 0.9703
Best testing accuracy was: 0.9683
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.0577, Total Loss: 0.0562, Loss Parts: [0.0562]: 100%|███████████████████| 469/469 [00:07<00:00, 60.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0577
Training Accuracy: 0.9831
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1126
Testing accuracy: 0.9709
Best testing accuracy was: 0.9703
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.0530, Total Loss: 0.0090, Loss Parts: [0.0090]: 100%|███████████████████| 469/469 [00:07<00:00, 62.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0530
Training Accuracy: 0.9843
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1137
Testing accuracy: 0.9717
Best testing accuracy was: 0.9709
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.0477, Total Loss: 0.0050, Loss Parts: [0.0050]: 100%|███████████████████| 469/469 [00:07<00:00, 62.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0477
Training Accuracy: 0.9857
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1241
Testing accuracy: 0.9685
Best testing accuracy was: 0.9717
Stagnation was: 1

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.0405, Total Loss: 0.0676, Loss Parts: [0.0676]: 100%|███████████████████| 469/469 [00:07<00:00, 63.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0405
Training Accuracy: 0.9875
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1139
Testing accuracy: 0.9730
Best testing accuracy was: 0.9717
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.0356, Total Loss: 0.0402, Loss Parts: [0.0402]: 100%|███████████████████| 469/469 [00:07<00:00, 63.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0356
Training Accuracy: 0.9895
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1244
Testing accuracy: 0.9707
Best testing accuracy was: 0.9730
Stagnation was: 1

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.0349, Total Loss: 0.0196, Loss Parts: [0.0196]: 100%|███████████████████| 469/469 [00:07<00:00, 61.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0349
Training Accuracy: 0.9892
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1241
Testing accuracy: 0.9727
Best testing accuracy was: 0.9730
Stagnation was: 2

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.0277, Total Loss: 0.0903, Loss Parts: [0.0903]: 100%|███████████████████| 469/469 [00:07<00:00, 61.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0277
Training Accuracy: 0.9917
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1138
Testing accuracy: 0.9755
Best testing accuracy was: 0.9730
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.0244, Total Loss: 0.0977, Loss Parts: [0.0977]: 100%|███████████████████| 469/469 [00:07<00:00, 60.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0244
Training Accuracy: 0.9927
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1335
Testing accuracy: 0.9720
Best testing accuracy was: 0.9755
Stagnation was: 1

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.0223, Total Loss: 0.0250, Loss Parts: [0.0250]: 100%|███████████████████| 469/469 [00:07<00:00, 66.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0223
Training Accuracy: 0.9929
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1301
Testing accuracy: 0.9724
Best testing accuracy was: 0.9755
Stagnation was: 2

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.0207, Total Loss: 0.0188, Loss Parts: [0.0188]: 100%|███████████████████| 469/469 [00:07<00:00, 62.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0207
Training Accuracy: 0.9933
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1308
Testing accuracy: 0.9732
Best testing accuracy was: 0.9755
Stagnation was: 3

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.0182, Total Loss: 0.0192, Loss Parts: [0.0192]: 100%|███████████████████| 469/469 [00:07<00:00, 65.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0182
Training Accuracy: 0.9948
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1382
Testing accuracy: 0.9737
Best testing accuracy was: 0.9755
Stagnation was: 4

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.0215, Total Loss: 0.0232, Loss Parts: [0.0232]: 100%|███████████████████| 469/469 [00:07<00:00, 63.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0215
Training Accuracy: 0.9931
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1496
Testing accuracy: 0.9709
Best testing accuracy was: 0.9755
Ran out of patience at epoch: 19
Patience was: 5
Training complete in 3m 37s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\3638ed3f4448b30f\sessions\Session 05-19-2021 05-58-21 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'ea

Avg. Loss: 2.3017, Total Loss: 2.3077, Loss Parts: [2.3077]: 100%|███████████████████| 469/469 [00:07<00:00, 63.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1107
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2925, Loss Parts: [2.2925]: 100%|███████████████████| 469/469 [00:07<00:00, 62.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3033, Loss Parts: [2.3033]: 100%|███████████████████| 469/469 [00:07<00:00, 64.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3034, Loss Parts: [2.3034]: 100%|███████████████████| 469/469 [00:07<00:00, 64.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3025, Loss Parts: [2.3025]: 100%|███████████████████| 469/469 [00:07<00:00, 62.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3010, Loss Parts: [2.3010]: 100%|███████████████████| 469/469 [00:07<00:00, 60.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2888, Loss Parts: [2.2888]: 100%|███████████████████| 469/469 [00:07<00:00, 62.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3006, Loss Parts: [2.3006]: 100%|███████████████████| 469/469 [00:06<00:00, 67.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3081, Loss Parts: [2.3081]: 100%|███████████████████| 469/469 [00:07<00:00, 61.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3044, Loss Parts: [2.3044]: 100%|███████████████████| 469/469 [00:07<00:00, 59.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2991, Loss Parts: [2.2991]: 100%|███████████████████| 469/469 [00:07<00:00, 62.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3004, Loss Parts: [2.3004]: 100%|███████████████████| 469/469 [00:07<00:00, 62.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:07<00:00, 60.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2946, Loss Parts: [2.2946]: 100%|███████████████████| 469/469 [00:07<00:00, 64.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3022, Loss Parts: [2.3022]: 100%|███████████████████| 469/469 [00:07<00:00, 62.62it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3005, Loss Parts: [2.3005]: 100%|███████████████████| 469/469 [00:07<00:00, 61.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3154, Loss Parts: [2.3154]: 100%|███████████████████| 469/469 [00:07<00:00, 62.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3111, Loss Parts: [2.3111]: 100%|███████████████████| 469/469 [00:07<00:00, 63.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3006, Loss Parts: [2.3006]: 100%|███████████████████| 469/469 [00:07<00:00, 63.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3056, Loss Parts: [2.3056]: 100%|███████████████████| 469/469 [00:07<00:00, 63.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3033, Loss Parts: [2.3033]: 100%|███████████████████| 469/469 [00:07<00:00, 65.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:06<00:00, 71.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3011, Loss Parts: [2.3011]: 100%|███████████████████| 469/469 [00:06<00:00, 74.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3039, Loss Parts: [2.3039]: 100%|███████████████████| 469/469 [00:05<00:00, 79.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3093, Loss Parts: [2.3093]: 100%|███████████████████| 469/469 [00:06<00:00, 75.78it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3114, Loss Parts: [2.3114]: 100%|███████████████████| 469/469 [00:06<00:00, 67.57it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.21it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3021, Loss Parts: [2.3021]: 100%|███████████████████| 469/469 [00:07<00:00, 63.39it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2966, Loss Parts: [2.2966]: 100%|███████████████████| 469/469 [00:06<00:00, 76.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2964, Loss Parts: [2.2964]: 100%|███████████████████| 469/469 [00:05<00:00, 78.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.06it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:06<00:00, 70.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2972, Loss Parts: [2.2972]: 100%|███████████████████| 469/469 [00:07<00:00, 64.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3075, Loss Parts: [2.3075]: 100%|███████████████████| 469/469 [00:07<00:00, 62.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3052, Loss Parts: [2.3052]: 100%|███████████████████| 469/469 [00:06<00:00, 67.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2981, Loss Parts: [2.2981]: 100%|███████████████████| 469/469 [00:07<00:00, 64.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3048, Loss Parts: [2.3048]: 100%|███████████████████| 469/469 [00:06<00:00, 67.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3033, Loss Parts: [2.3033]: 100%|███████████████████| 469/469 [00:07<00:00, 65.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2998, Loss Parts: [2.2998]: 100%|███████████████████| 469/469 [00:07<00:00, 65.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3066, Loss Parts: [2.3066]: 100%|███████████████████| 469/469 [00:07<00:00, 66.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3063, Loss Parts: [2.3063]: 100%|███████████████████| 469/469 [00:07<00:00, 65.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3091, Loss Parts: [2.3091]: 100%|███████████████████| 469/469 [00:07<00:00, 66.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3046, Loss Parts: [2.3046]: 100%|███████████████████| 469/469 [00:06<00:00, 69.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3086, Loss Parts: [2.3086]: 100%|███████████████████| 469/469 [00:06<00:00, 71.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3022, Loss Parts: [2.3022]: 100%|███████████████████| 469/469 [00:06<00:00, 69.20it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3076, Loss Parts: [2.3076]: 100%|███████████████████| 469/469 [00:06<00:00, 67.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2959, Loss Parts: [2.2959]: 100%|███████████████████| 469/469 [00:06<00:00, 71.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3078, Loss Parts: [2.3078]: 100%|███████████████████| 469/469 [00:06<00:00, 70.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3014, Loss Parts: [2.3014]: 100%|███████████████████| 469/469 [00:06<00:00, 71.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.19it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3060, Loss Parts: [2.3060]: 100%|███████████████████| 469/469 [00:06<00:00, 74.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2969, Loss Parts: [2.2969]: 100%|███████████████████| 469/469 [00:07<00:00, 65.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3090, Loss Parts: [2.3090]: 100%|███████████████████| 469/469 [00:06<00:00, 67.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 8m 50s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\827cdb88f8dc465c\sessions\Session 05-19-2021 06-07-11 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}, 'trial_

Avg. Loss: 2.3018, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:06<00:00, 74.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3018
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3039, Loss Parts: [2.3039]: 100%|███████████████████| 469/469 [00:06<00:00, 68.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2971, Loss Parts: [2.2971]: 100%|███████████████████| 469/469 [00:07<00:00, 62.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3057, Loss Parts: [2.3057]: 100%|███████████████████| 469/469 [00:07<00:00, 64.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3005, Loss Parts: [2.3005]: 100%|███████████████████| 469/469 [00:07<00:00, 65.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2966, Loss Parts: [2.2966]: 100%|███████████████████| 469/469 [00:06<00:00, 68.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1111
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3052, Loss Parts: [2.3052]: 100%|███████████████████| 469/469 [00:07<00:00, 65.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:07<00:00, 64.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1113
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:07<00:00, 64.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:07<00:00, 64.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2977, Loss Parts: [2.2977]: 100%|███████████████████| 469/469 [00:07<00:00, 65.68it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2972, Loss Parts: [2.2972]: 100%|███████████████████| 469/469 [00:07<00:00, 65.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3039, Loss Parts: [2.3039]: 100%|███████████████████| 469/469 [00:07<00:00, 62.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3018
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2972, Loss Parts: [2.2972]: 100%|███████████████████| 469/469 [00:07<00:00, 62.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:07<00:00, 63.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1116
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3049, Loss Parts: [2.3049]: 100%|███████████████████| 469/469 [00:07<00:00, 60.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3032, Loss Parts: [2.3032]: 100%|███████████████████| 469/469 [00:07<00:00, 61.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2946, Loss Parts: [2.2946]: 100%|███████████████████| 469/469 [00:07<00:00, 65.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.38it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2993, Loss Parts: [2.2993]: 100%|███████████████████| 469/469 [00:07<00:00, 60.20it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:07<00:00, 63.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3018
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3034, Loss Parts: [2.3034]: 100%|███████████████████| 469/469 [00:07<00:00, 64.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:07<00:00, 60.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:07<00:00, 61.22it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3044, Loss Parts: [2.3044]: 100%|███████████████████| 469/469 [00:07<00:00, 61.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3035, Loss Parts: [2.3035]: 100%|███████████████████| 469/469 [00:07<00:00, 59.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3041, Loss Parts: [2.3041]: 100%|███████████████████| 469/469 [00:07<00:00, 64.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:07<00:00, 60.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2980, Loss Parts: [2.2980]: 100%|███████████████████| 469/469 [00:07<00:00, 63.24it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1122
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3034, Loss Parts: [2.3034]: 100%|███████████████████| 469/469 [00:07<00:00, 60.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3038, Loss Parts: [2.3038]: 100%|███████████████████| 469/469 [00:07<00:00, 59.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1111
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3004, Loss Parts: [2.3004]: 100%|███████████████████| 469/469 [00:07<00:00, 60.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2994, Loss Parts: [2.2994]: 100%|███████████████████| 469/469 [00:07<00:00, 60.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.22it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3071, Loss Parts: [2.3071]: 100%|███████████████████| 469/469 [00:07<00:00, 61.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3005, Loss Parts: [2.3005]: 100%|███████████████████| 469/469 [00:07<00:00, 61.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2981, Loss Parts: [2.2981]: 100%|███████████████████| 469/469 [00:07<00:00, 62.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:07<00:00, 63.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3020
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:07<00:00, 63.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.65it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2955, Loss Parts: [2.2955]: 100%|███████████████████| 469/469 [00:07<00:00, 59.10it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3036, Loss Parts: [2.3036]: 100%|███████████████████| 469/469 [00:07<00:00, 61.95it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3044, Loss Parts: [2.3044]: 100%|███████████████████| 469/469 [00:07<00:00, 65.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3030, Loss Parts: [2.3030]: 100%|███████████████████| 469/469 [00:06<00:00, 68.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3007, Loss Parts: [2.3007]: 100%|███████████████████| 469/469 [00:06<00:00, 69.85it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3005, Loss Parts: [2.3005]: 100%|███████████████████| 469/469 [00:07<00:00, 63.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2995, Loss Parts: [2.2995]: 100%|███████████████████| 469/469 [00:07<00:00, 59.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3015, Loss Parts: [2.3015]: 100%|███████████████████| 469/469 [00:06<00:00, 67.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.22it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3035, Loss Parts: [2.3035]: 100%|███████████████████| 469/469 [00:07<00:00, 66.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3052, Loss Parts: [2.3052]: 100%|███████████████████| 469/469 [00:07<00:00, 65.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3075, Loss Parts: [2.3075]: 100%|███████████████████| 469/469 [00:07<00:00, 64.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.32it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3030, Loss Parts: [2.3030]: 100%|███████████████████| 469/469 [00:07<00:00, 60.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3008, Loss Parts: [2.3008]: 100%|███████████████████| 469/469 [00:07<00:00, 61.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 9m 7s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\162696cc649a8201\sessions\Session 05-19-2021 06-16-18 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5}

Avg. Loss: 2.3015, Total Loss: 2.3055, Loss Parts: [2.3055]: 100%|███████████████████| 469/469 [00:07<00:00, 60.95it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1107
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3147, Loss Parts: [2.3147]: 100%|███████████████████| 469/469 [00:07<00:00, 59.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2986, Loss Parts: [2.2986]: 100%|███████████████████| 469/469 [00:07<00:00, 58.99it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3071, Loss Parts: [2.3071]: 100%|███████████████████| 469/469 [00:07<00:00, 60.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3012, Total Loss: 2.3001, Loss Parts: [2.3001]: 100%|███████████████████| 469/469 [00:07<00:00, 59.65it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3012
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3008
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3009, Total Loss: 2.3059, Loss Parts: [2.3059]: 100%|███████████████████| 469/469 [00:08<00:00, 58.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3009
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3002
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.2868, Total Loss: 2.1734, Loss Parts: [2.1734]: 100%|███████████████████| 469/469 [00:07<00:00, 59.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.2868
Training Accuracy: 0.1257
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.1290
Testing accuracy: 0.2054
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 1.4395, Total Loss: 0.8291, Loss Parts: [0.8291]: 100%|███████████████████| 469/469 [00:07<00:00, 63.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.4395
Training Accuracy: 0.4035
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 1.0649
Testing accuracy: 0.5589
Best testing accuracy was: 0.2054
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 0.6438, Total Loss: 0.2880, Loss Parts: [0.2880]: 100%|███████████████████| 469/469 [00:08<00:00, 57.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.6438
Training Accuracy: 0.7949
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3933
Testing accuracy: 0.9021
Best testing accuracy was: 0.5589
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 0.3141, Total Loss: 0.2448, Loss Parts: [0.2448]: 100%|███████████████████| 469/469 [00:08<00:00, 57.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.3141
Training Accuracy: 0.9221
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2828
Testing accuracy: 0.9333
Best testing accuracy was: 0.9021
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 0.2210, Total Loss: 0.1318, Loss Parts: [0.1318]: 100%|███████████████████| 469/469 [00:08<00:00, 57.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2210
Training Accuracy: 0.9444
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.3376
Testing accuracy: 0.9201
Best testing accuracy was: 0.9333
Stagnation was: 1

----------
Epoch 12/50
----------
Training


Avg. Loss: 0.1760, Total Loss: 0.1755, Loss Parts: [0.1755]: 100%|███████████████████| 469/469 [00:08<00:00, 57.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1760
Training Accuracy: 0.9556
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2301
Testing accuracy: 0.9484
Best testing accuracy was: 0.9333
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 0.1511, Total Loss: 0.1404, Loss Parts: [0.1404]: 100%|███████████████████| 469/469 [00:08<00:00, 57.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1511
Training Accuracy: 0.9613
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2078
Testing accuracy: 0.9503
Best testing accuracy was: 0.9484
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 0.1335, Total Loss: 0.2183, Loss Parts: [0.2183]: 100%|███████████████████| 469/469 [00:07<00:00, 61.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1335
Training Accuracy: 0.9645
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2196
Testing accuracy: 0.9502
Best testing accuracy was: 0.9503
Stagnation was: 1

----------
Epoch 15/50
----------
Training


Avg. Loss: 0.1200, Total Loss: 0.3590, Loss Parts: [0.3590]: 100%|███████████████████| 469/469 [00:08<00:00, 57.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1200
Training Accuracy: 0.9691
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1810
Testing accuracy: 0.9621
Best testing accuracy was: 0.9503
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 0.1059, Total Loss: 0.1470, Loss Parts: [0.1470]: 100%|███████████████████| 469/469 [00:07<00:00, 60.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1059
Training Accuracy: 0.9719
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1790
Testing accuracy: 0.9582
Best testing accuracy was: 0.9621
Stagnation was: 1

----------
Epoch 17/50
----------
Training


Avg. Loss: 0.0953, Total Loss: 0.1252, Loss Parts: [0.1252]: 100%|███████████████████| 469/469 [00:08<00:00, 57.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0953
Training Accuracy: 0.9751
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1634
Testing accuracy: 0.9622
Best testing accuracy was: 0.9621
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 0.0890, Total Loss: 0.0273, Loss Parts: [0.0273]: 100%|███████████████████| 469/469 [00:07<00:00, 58.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0890
Training Accuracy: 0.9769
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1808
Testing accuracy: 0.9624
Best testing accuracy was: 0.9622
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 0.0852, Total Loss: 0.0710, Loss Parts: [0.0710]: 100%|███████████████████| 469/469 [00:07<00:00, 60.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0852
Training Accuracy: 0.9776
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1723
Testing accuracy: 0.9629
Best testing accuracy was: 0.9624
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 0.0660, Total Loss: 0.0940, Loss Parts: [0.0940]: 100%|███████████████████| 469/469 [00:07<00:00, 60.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0660
Training Accuracy: 0.9832
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1647
Testing accuracy: 0.9619
Best testing accuracy was: 0.9629
Stagnation was: 1

----------
Epoch 21/50
----------
Training


Avg. Loss: 0.0672, Total Loss: 0.0153, Loss Parts: [0.0153]: 100%|███████████████████| 469/469 [00:07<00:00, 62.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0672
Training Accuracy: 0.9823
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.01it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1464
Testing accuracy: 0.9685
Best testing accuracy was: 0.9629
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 0.0630, Total Loss: 0.1370, Loss Parts: [0.1370]: 100%|███████████████████| 469/469 [00:07<00:00, 66.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0630
Training Accuracy: 0.9829
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1558
Testing accuracy: 0.9674
Best testing accuracy was: 0.9685
Stagnation was: 1

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.0572, Total Loss: 0.1560, Loss Parts: [0.1560]: 100%|███████████████████| 469/469 [00:07<00:00, 64.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0572
Training Accuracy: 0.9851
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1638
Testing accuracy: 0.9627
Best testing accuracy was: 0.9685
Stagnation was: 2

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.0568, Total Loss: 0.1154, Loss Parts: [0.1154]: 100%|███████████████████| 469/469 [00:07<00:00, 60.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0568
Training Accuracy: 0.9843
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1475
Testing accuracy: 0.9704
Best testing accuracy was: 0.9685
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.0527, Total Loss: 0.0025, Loss Parts: [0.0025]: 100%|███████████████████| 469/469 [00:08<00:00, 58.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0527
Training Accuracy: 0.9860
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1498
Testing accuracy: 0.9697
Best testing accuracy was: 0.9704
Stagnation was: 1

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.0421, Total Loss: 0.0755, Loss Parts: [0.0755]: 100%|███████████████████| 469/469 [00:07<00:00, 63.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0421
Training Accuracy: 0.9887
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.57it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1505
Testing accuracy: 0.9667
Best testing accuracy was: 0.9704
Stagnation was: 2

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.0393, Total Loss: 0.1312, Loss Parts: [0.1312]: 100%|███████████████████| 469/469 [00:07<00:00, 59.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0393
Training Accuracy: 0.9893
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1430
Testing accuracy: 0.9690
Best testing accuracy was: 0.9704
Stagnation was: 3

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.0334, Total Loss: 0.1096, Loss Parts: [0.1096]: 100%|███████████████████| 469/469 [00:07<00:00, 60.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0334
Training Accuracy: 0.9910
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1379
Testing accuracy: 0.9722
Best testing accuracy was: 0.9704
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.0323, Total Loss: 0.0038, Loss Parts: [0.0038]: 100%|███████████████████| 469/469 [00:07<00:00, 61.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0323
Training Accuracy: 0.9915
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.81it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1343
Testing accuracy: 0.9722
Best testing accuracy was: 0.9722
Stagnation was: 1

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.0305, Total Loss: 0.0321, Loss Parts: [0.0321]: 100%|███████████████████| 469/469 [00:07<00:00, 60.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0305
Training Accuracy: 0.9919
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1453
Testing accuracy: 0.9686
Best testing accuracy was: 0.9722
Stagnation was: 2

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.0320, Total Loss: 0.0583, Loss Parts: [0.0583]: 100%|███████████████████| 469/469 [00:08<00:00, 57.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0320
Training Accuracy: 0.9915
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1417
Testing accuracy: 0.9712
Best testing accuracy was: 0.9722
Stagnation was: 3

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.0267, Total Loss: 0.0422, Loss Parts: [0.0422]: 100%|███████████████████| 469/469 [00:07<00:00, 59.22it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0267
Training Accuracy: 0.9926
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1389
Testing accuracy: 0.9716
Best testing accuracy was: 0.9722
Stagnation was: 4

----------
Epoch 33/50
----------
Training


Avg. Loss: 0.0266, Total Loss: 0.0620, Loss Parts: [0.0620]: 100%|███████████████████| 469/469 [00:07<00:00, 58.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0266
Training Accuracy: 0.9927
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1378
Testing accuracy: 0.9721
Best testing accuracy was: 0.9722
Ran out of patience at epoch: 32
Patience was: 5
Training complete in 6m 14s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\5cb241610e7ddaf1\sessions\Session 05-19-2021 06-22-32 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc'

Avg. Loss: 2.3017, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:07<00:00, 58.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2979, Loss Parts: [2.2979]: 100%|███████████████████| 469/469 [00:07<00:00, 60.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2985, Loss Parts: [2.2985]: 100%|███████████████████| 469/469 [00:08<00:00, 58.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2992, Loss Parts: [2.2992]: 100%|███████████████████| 469/469 [00:08<00:00, 56.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:08<00:00, 58.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3054, Loss Parts: [2.3054]: 100%|███████████████████| 469/469 [00:08<00:00, 57.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3178, Loss Parts: [2.3178]: 100%|███████████████████| 469/469 [00:06<00:00, 70.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3045, Loss Parts: [2.3045]: 100%|███████████████████| 469/469 [00:08<00:00, 57.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:08<00:00, 57.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2977, Loss Parts: [2.2977]: 100%|███████████████████| 469/469 [00:08<00:00, 57.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3074, Loss Parts: [2.3074]: 100%|███████████████████| 469/469 [00:07<00:00, 58.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3028, Loss Parts: [2.3028]: 100%|███████████████████| 469/469 [00:08<00:00, 57.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:07<00:00, 58.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3078, Loss Parts: [2.3078]: 100%|███████████████████| 469/469 [00:07<00:00, 58.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3110, Loss Parts: [2.3110]: 100%|███████████████████| 469/469 [00:08<00:00, 58.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3009
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2950, Loss Parts: [2.2950]: 100%|███████████████████| 469/469 [00:08<00:00, 58.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3100, Loss Parts: [2.3100]: 100%|███████████████████| 469/469 [00:08<00:00, 56.85it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2997, Loss Parts: [2.2997]: 100%|███████████████████| 469/469 [00:08<00:00, 57.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3052, Loss Parts: [2.3052]: 100%|███████████████████| 469/469 [00:08<00:00, 56.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3007, Loss Parts: [2.3007]: 100%|███████████████████| 469/469 [00:08<00:00, 56.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.31it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2944, Loss Parts: [2.2944]: 100%|███████████████████| 469/469 [00:08<00:00, 57.20it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3091, Loss Parts: [2.3091]: 100%|███████████████████| 469/469 [00:07<00:00, 59.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:07<00:00, 61.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3028, Loss Parts: [2.3028]: 100%|███████████████████| 469/469 [00:07<00:00, 61.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:08<00:00, 57.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2997, Loss Parts: [2.2997]: 100%|███████████████████| 469/469 [00:07<00:00, 58.85it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3045, Loss Parts: [2.3045]: 100%|███████████████████| 469/469 [00:08<00:00, 56.85it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2985, Loss Parts: [2.2985]: 100%|███████████████████| 469/469 [00:07<00:00, 61.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3074, Loss Parts: [2.3074]: 100%|███████████████████| 469/469 [00:08<00:00, 56.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3030, Loss Parts: [2.3030]: 100%|███████████████████| 469/469 [00:08<00:00, 55.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.83it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:08<00:00, 58.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3033, Loss Parts: [2.3033]: 100%|███████████████████| 469/469 [00:08<00:00, 56.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2967, Loss Parts: [2.2967]: 100%|███████████████████| 469/469 [00:07<00:00, 59.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3099, Loss Parts: [2.3099]: 100%|███████████████████| 469/469 [00:08<00:00, 57.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3089, Loss Parts: [2.3089]: 100%|███████████████████| 469/469 [00:08<00:00, 57.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2963, Loss Parts: [2.2963]: 100%|███████████████████| 469/469 [00:07<00:00, 59.82it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2995, Loss Parts: [2.2995]: 100%|███████████████████| 469/469 [00:07<00:00, 59.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2982, Loss Parts: [2.2982]: 100%|███████████████████| 469/469 [00:06<00:00, 67.78it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.65it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2983, Loss Parts: [2.2983]: 100%|███████████████████| 469/469 [00:07<00:00, 59.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3017, Loss Parts: [2.3017]: 100%|███████████████████| 469/469 [00:07<00:00, 64.82it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3024, Loss Parts: [2.3024]: 100%|███████████████████| 469/469 [00:06<00:00, 67.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3110, Loss Parts: [2.3110]: 100%|███████████████████| 469/469 [00:07<00:00, 66.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3027, Loss Parts: [2.3027]: 100%|███████████████████| 469/469 [00:07<00:00, 62.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2956, Loss Parts: [2.2956]: 100%|███████████████████| 469/469 [00:07<00:00, 66.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3035, Loss Parts: [2.3035]: 100%|███████████████████| 469/469 [00:07<00:00, 63.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2939, Loss Parts: [2.2939]: 100%|███████████████████| 469/469 [00:07<00:00, 62.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3128, Loss Parts: [2.3128]: 100%|███████████████████| 469/469 [00:08<00:00, 57.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2952, Loss Parts: [2.2952]: 100%|███████████████████| 469/469 [00:07<00:00, 59.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3063, Loss Parts: [2.3063]: 100%|███████████████████| 469/469 [00:07<00:00, 62.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.06it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3049, Loss Parts: [2.3049]: 100%|███████████████████| 469/469 [00:07<00:00, 58.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 9m 32s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\118a90f4f3627eb8\sessions\Session 05-19-2021 06-32-04 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_patience': 5

Avg. Loss: 2.3018, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:07<00:00, 61.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3018
Training Accuracy: 0.1103
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:07<00:00, 59.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1115
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3004, Loss Parts: [2.3004]: 100%|███████████████████| 469/469 [00:07<00:00, 58.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2919, Loss Parts: [2.2919]: 100%|███████████████████| 469/469 [00:07<00:00, 60.65it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:08<00:00, 57.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1028
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3046, Loss Parts: [2.3046]: 100%|███████████████████| 469/469 [00:08<00:00, 58.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3042, Loss Parts: [2.3042]: 100%|███████████████████| 469/469 [00:08<00:00, 56.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2984, Loss Parts: [2.2984]: 100%|███████████████████| 469/469 [00:08<00:00, 57.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3062, Loss Parts: [2.3062]: 100%|███████████████████| 469/469 [00:07<00:00, 59.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3032, Loss Parts: [2.3032]: 100%|███████████████████| 469/469 [00:07<00:00, 59.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2985, Loss Parts: [2.2985]: 100%|███████████████████| 469/469 [00:08<00:00, 57.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3022, Loss Parts: [2.3022]: 100%|███████████████████| 469/469 [00:07<00:00, 60.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2995, Loss Parts: [2.2995]: 100%|███████████████████| 469/469 [00:07<00:00, 60.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3020, Loss Parts: [2.3020]: 100%|███████████████████| 469/469 [00:07<00:00, 59.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3040, Loss Parts: [2.3040]: 100%|███████████████████| 469/469 [00:07<00:00, 66.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3054, Loss Parts: [2.3054]: 100%|███████████████████| 469/469 [00:07<00:00, 62.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:08<00:00, 57.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.89it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:08<00:00, 57.31it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1123
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3042, Loss Parts: [2.3042]: 100%|███████████████████| 469/469 [00:07<00:00, 59.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1116
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.57it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3100, Loss Parts: [2.3100]: 100%|███████████████████| 469/469 [00:07<00:00, 64.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3034, Loss Parts: [2.3034]: 100%|███████████████████| 469/469 [00:08<00:00, 58.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2929, Loss Parts: [2.2929]: 100%|███████████████████| 469/469 [00:08<00:00, 56.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3038, Loss Parts: [2.3038]: 100%|███████████████████| 469/469 [00:07<00:00, 60.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.72it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3006, Loss Parts: [2.3006]: 100%|███████████████████| 469/469 [00:07<00:00, 60.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1114
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3022, Loss Parts: [2.3022]: 100%|███████████████████| 469/469 [00:07<00:00, 59.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:06<00:00, 69.68it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.98it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:06<00:00, 72.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3033, Loss Parts: [2.3033]: 100%|███████████████████| 469/469 [00:07<00:00, 65.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3058, Loss Parts: [2.3058]: 100%|███████████████████| 469/469 [00:06<00:00, 75.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3037, Loss Parts: [2.3037]: 100%|███████████████████| 469/469 [00:07<00:00, 60.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.81it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3041, Loss Parts: [2.3041]: 100%|███████████████████| 469/469 [00:06<00:00, 71.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:07<00:00, 66.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3041, Loss Parts: [2.3041]: 100%|███████████████████| 469/469 [00:07<00:00, 61.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3072, Loss Parts: [2.3072]: 100%|███████████████████| 469/469 [00:07<00:00, 59.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.03it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2997, Loss Parts: [2.2997]: 100%|███████████████████| 469/469 [00:07<00:00, 59.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1112
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.87it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2982, Loss Parts: [2.2982]: 100%|███████████████████| 469/469 [00:07<00:00, 59.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:08<00:00, 57.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3042, Loss Parts: [2.3042]: 100%|███████████████████| 469/469 [00:07<00:00, 62.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2992, Loss Parts: [2.2992]: 100%|███████████████████| 469/469 [00:08<00:00, 58.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3002, Loss Parts: [2.3002]: 100%|███████████████████| 469/469 [00:08<00:00, 57.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:08<00:00, 58.62it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3020, Loss Parts: [2.3020]: 100%|███████████████████| 469/469 [00:07<00:00, 60.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3055, Loss Parts: [2.3055]: 100%|███████████████████| 469/469 [00:07<00:00, 59.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3056, Loss Parts: [2.3056]: 100%|███████████████████| 469/469 [00:08<00:00, 57.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2997, Loss Parts: [2.2997]: 100%|███████████████████| 469/469 [00:07<00:00, 59.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3020, Loss Parts: [2.3020]: 100%|███████████████████| 469/469 [00:08<00:00, 57.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.19it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3012, Loss Parts: [2.3012]: 100%|███████████████████| 469/469 [00:07<00:00, 64.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3003, Loss Parts: [2.3003]: 100%|███████████████████| 469/469 [00:08<00:00, 57.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3040, Loss Parts: [2.3040]: 100%|███████████████████| 469/469 [00:08<00:00, 56.58it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.82it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3006, Loss Parts: [2.3006]: 100%|███████████████████| 469/469 [00:08<00:00, 58.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 9m 25s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\e15583346bb4c876\sessions\Session 05-19-2021 06-41-29 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_pa

Avg. Loss: 2.3017, Total Loss: 2.2998, Loss Parts: [2.2998]: 100%|███████████████████| 469/469 [00:08<00:00, 56.26it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1107
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2993, Loss Parts: [2.2993]: 100%|███████████████████| 469/469 [00:07<00:00, 60.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3087, Loss Parts: [2.3087]: 100%|███████████████████| 469/469 [00:08<00:00, 55.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2909, Loss Parts: [2.2909]: 100%|███████████████████| 469/469 [00:08<00:00, 54.52it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.21it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3044, Loss Parts: [2.3044]: 100%|███████████████████| 469/469 [00:08<00:00, 56.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:08<00:00, 55.75it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.2943, Loss Parts: [2.2943]: 100%|███████████████████| 469/469 [00:08<00:00, 56.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:08<00:00, 56.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.2975, Loss Parts: [2.2975]: 100%|███████████████████| 469/469 [00:08<00:00, 55.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3079, Loss Parts: [2.3079]: 100%|███████████████████| 469/469 [00:08<00:00, 55.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3096, Loss Parts: [2.3096]: 100%|███████████████████| 469/469 [00:08<00:00, 56.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3119, Loss Parts: [2.3119]: 100%|███████████████████| 469/469 [00:07<00:00, 60.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.00it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3051, Loss Parts: [2.3051]: 100%|███████████████████| 469/469 [00:08<00:00, 56.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2954, Loss Parts: [2.2954]: 100%|███████████████████| 469/469 [00:08<00:00, 55.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2990, Loss Parts: [2.2990]: 100%|███████████████████| 469/469 [00:08<00:00, 55.39it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2880, Loss Parts: [2.2880]: 100%|███████████████████| 469/469 [00:08<00:00, 54.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3003, Loss Parts: [2.3003]: 100%|███████████████████| 469/469 [00:08<00:00, 57.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3092, Loss Parts: [2.3092]: 100%|███████████████████| 469/469 [00:08<00:00, 56.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3012, Total Loss: 2.3137, Loss Parts: [2.3137]: 100%|███████████████████| 469/469 [00:08<00:00, 55.57it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3012
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.30it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3009
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3009, Total Loss: 2.3163, Loss Parts: [2.3163]: 100%|███████████████████| 469/469 [00:08<00:00, 55.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3009
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3002
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.2847, Total Loss: 2.1069, Loss Parts: [2.1069]: 100%|███████████████████| 469/469 [00:08<00:00, 56.76it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.2847
Training Accuracy: 0.1394
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.1220
Testing accuracy: 0.2149
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 1.4482, Total Loss: 0.7354, Loss Parts: [0.7354]: 100%|███████████████████| 469/469 [00:07<00:00, 59.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 1.4482
Training Accuracy: 0.4191
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.9924
Testing accuracy: 0.7338
Best testing accuracy was: 0.2149
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 0.8784, Total Loss: 0.4296, Loss Parts: [0.4296]: 100%|███████████████████| 469/469 [00:08<00:00, 55.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.8784
Training Accuracy: 0.7073
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.6365
Testing accuracy: 0.8258
Best testing accuracy was: 0.7338
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 0.6367, Total Loss: 0.6486, Loss Parts: [0.6486]: 100%|███████████████████| 469/469 [00:08<00:00, 56.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.6367
Training Accuracy: 0.7926
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.21it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.7052
Testing accuracy: 0.7708
Best testing accuracy was: 0.8258
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 0.2699, Total Loss: 0.2637, Loss Parts: [0.2637]: 100%|███████████████████| 469/469 [00:08<00:00, 54.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.2699
Training Accuracy: 0.9354
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2548
Testing accuracy: 0.9377
Best testing accuracy was: 0.8258
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 0.1915, Total Loss: 0.2497, Loss Parts: [0.2497]: 100%|███████████████████| 469/469 [00:08<00:00, 55.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1915
Training Accuracy: 0.9525
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.2248
Testing accuracy: 0.9494
Best testing accuracy was: 0.9377
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 0.1593, Total Loss: 0.1850, Loss Parts: [0.1850]: 100%|███████████████████| 469/469 [00:08<00:00, 54.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1593
Training Accuracy: 0.9611
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1849
Testing accuracy: 0.9604
Best testing accuracy was: 0.9494
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 0.1406, Total Loss: 0.2030, Loss Parts: [0.2030]: 100%|███████████████████| 469/469 [00:08<00:00, 55.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1406
Training Accuracy: 0.9663
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1992
Testing accuracy: 0.9563
Best testing accuracy was: 0.9604
Stagnation was: 1

----------
Epoch 29/50
----------
Training


Avg. Loss: 0.1255, Total Loss: 0.1163, Loss Parts: [0.1163]: 100%|███████████████████| 469/469 [00:08<00:00, 55.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1255
Training Accuracy: 0.9700
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1646
Testing accuracy: 0.9625
Best testing accuracy was: 0.9604
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 0.1110, Total Loss: 0.0926, Loss Parts: [0.0926]: 100%|███████████████████| 469/469 [00:08<00:00, 55.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1110
Training Accuracy: 0.9736
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1471
Testing accuracy: 0.9660
Best testing accuracy was: 0.9625
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 0.1061, Total Loss: 0.1297, Loss Parts: [0.1297]: 100%|███████████████████| 469/469 [00:08<00:00, 55.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.1061
Training Accuracy: 0.9746
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1801
Testing accuracy: 0.9606
Best testing accuracy was: 0.9660
Stagnation was: 1

----------
Epoch 32/50
----------
Training


Avg. Loss: 0.0946, Total Loss: 0.0679, Loss Parts: [0.0679]: 100%|███████████████████| 469/469 [00:07<00:00, 63.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0946
Training Accuracy: 0.9773
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1542
Testing accuracy: 0.9650
Best testing accuracy was: 0.9660
Stagnation was: 2

----------
Epoch 33/50
----------
Training


Avg. Loss: 0.0867, Total Loss: 0.1235, Loss Parts: [0.1235]: 100%|███████████████████| 469/469 [00:08<00:00, 55.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0867
Training Accuracy: 0.9793
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1719
Testing accuracy: 0.9610
Best testing accuracy was: 0.9660
Stagnation was: 3

----------
Epoch 34/50
----------
Training


Avg. Loss: 0.0892, Total Loss: 0.0158, Loss Parts: [0.0158]: 100%|███████████████████| 469/469 [00:08<00:00, 55.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0892
Training Accuracy: 0.9785
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1651
Testing accuracy: 0.9642
Best testing accuracy was: 0.9660
Stagnation was: 4

----------
Epoch 35/50
----------
Training


Avg. Loss: 0.0829, Total Loss: 0.0306, Loss Parts: [0.0306]: 100%|███████████████████| 469/469 [00:08<00:00, 54.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 0.0829
Training Accuracy: 0.9798
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 0.1463
Testing accuracy: 0.9660
Best testing accuracy was: 0.9660
Ran out of patience at epoch: 34
Patience was: 5
Training complete in 6m 57s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\57549825e10ba640\sessions\Session 05-19-2021 06-48-26 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early

Avg. Loss: 2.3019, Total Loss: 2.3035, Loss Parts: [2.3035]: 100%|███████████████████| 469/469 [00:08<00:00, 54.50it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3019
Training Accuracy: 0.1108
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3050, Loss Parts: [2.3050]: 100%|███████████████████| 469/469 [00:08<00:00, 54.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2963, Loss Parts: [2.2963]: 100%|███████████████████| 469/469 [00:08<00:00, 54.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2947, Loss Parts: [2.2947]: 100%|███████████████████| 469/469 [00:08<00:00, 54.63it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3012, Loss Parts: [2.3012]: 100%|███████████████████| 469/469 [00:08<00:00, 53.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3009
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3081, Loss Parts: [2.3081]: 100%|███████████████████| 469/469 [00:08<00:00, 53.95it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3048, Loss Parts: [2.3048]: 100%|███████████████████| 469/469 [00:07<00:00, 62.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.00it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3046, Loss Parts: [2.3046]: 100%|███████████████████| 469/469 [00:08<00:00, 55.44it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2919, Loss Parts: [2.2919]: 100%|███████████████████| 469/469 [00:08<00:00, 57.15it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.59it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2990, Loss Parts: [2.2990]: 100%|███████████████████| 469/469 [00:07<00:00, 59.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3008, Loss Parts: [2.3008]: 100%|███████████████████| 469/469 [00:08<00:00, 57.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3001, Loss Parts: [2.3001]: 100%|███████████████████| 469/469 [00:08<00:00, 56.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3014, Loss Parts: [2.3014]: 100%|███████████████████| 469/469 [00:08<00:00, 57.01it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.80it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2969, Loss Parts: [2.2969]: 100%|███████████████████| 469/469 [00:08<00:00, 54.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2987, Loss Parts: [2.2987]: 100%|███████████████████| 469/469 [00:08<00:00, 55.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3099, Loss Parts: [2.3099]: 100%|███████████████████| 469/469 [00:08<00:00, 55.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2978, Loss Parts: [2.2978]: 100%|███████████████████| 469/469 [00:08<00:00, 55.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.38it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3090, Loss Parts: [2.3090]: 100%|███████████████████| 469/469 [00:08<00:00, 57.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.00it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3007, Loss Parts: [2.3007]: 100%|███████████████████| 469/469 [00:07<00:00, 59.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3085, Loss Parts: [2.3085]: 100%|███████████████████| 469/469 [00:07<00:00, 58.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3063, Loss Parts: [2.3063]: 100%|███████████████████| 469/469 [00:08<00:00, 56.78it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.91it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:07<00:00, 63.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3030, Loss Parts: [2.3030]: 100%|███████████████████| 469/469 [00:07<00:00, 64.85it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3027, Loss Parts: [2.3027]: 100%|███████████████████| 469/469 [00:07<00:00, 66.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.20it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3002, Loss Parts: [2.3002]: 100%|███████████████████| 469/469 [00:06<00:00, 67.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:06<00:00, 67.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.23it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3046, Loss Parts: [2.3046]: 100%|███████████████████| 469/469 [00:07<00:00, 65.25it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.54it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3106, Loss Parts: [2.3106]: 100%|███████████████████| 469/469 [00:07<00:00, 65.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.06it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3055, Loss Parts: [2.3055]: 100%|███████████████████| 469/469 [00:06<00:00, 68.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3046, Loss Parts: [2.3046]: 100%|███████████████████| 469/469 [00:07<00:00, 64.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:07<00:00, 65.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3017, Loss Parts: [2.3017]: 100%|███████████████████| 469/469 [00:07<00:00, 64.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.46it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3015, Loss Parts: [2.3015]: 100%|███████████████████| 469/469 [00:07<00:00, 60.06it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.68it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3058, Loss Parts: [2.3058]: 100%|███████████████████| 469/469 [00:08<00:00, 56.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3053, Loss Parts: [2.3053]: 100%|███████████████████| 469/469 [00:07<00:00, 58.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.66it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2915, Loss Parts: [2.2915]: 100%|███████████████████| 469/469 [00:08<00:00, 56.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3073, Loss Parts: [2.3073]: 100%|███████████████████| 469/469 [00:08<00:00, 55.88it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2934, Loss Parts: [2.2934]: 100%|███████████████████| 469/469 [00:07<00:00, 58.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3017, Loss Parts: [2.3017]: 100%|███████████████████| 469/469 [00:07<00:00, 61.37it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:08<00:00, 55.46it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2917, Loss Parts: [2.2917]: 100%|███████████████████| 469/469 [00:08<00:00, 55.23it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:08<00:00, 53.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:08<00:00, 55.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.19it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2981, Loss Parts: [2.2981]: 100%|███████████████████| 469/469 [00:08<00:00, 58.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3084, Loss Parts: [2.3084]: 100%|███████████████████| 469/469 [00:08<00:00, 54.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:08<00:00, 55.04it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2990, Loss Parts: [2.2990]: 100%|███████████████████| 469/469 [00:08<00:00, 54.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2950, Loss Parts: [2.2950]: 100%|███████████████████| 469/469 [00:08<00:00, 54.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3012, Loss Parts: [2.3012]: 100%|███████████████████| 469/469 [00:06<00:00, 67.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3017, Loss Parts: [2.3017]: 100%|███████████████████| 469/469 [00:08<00:00, 52.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 9m 39s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\1ef6d3c069e14304\sessions\Session 05-19-2021 06-58-05 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.1, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'early_stop_pa

Avg. Loss: 2.3017, Total Loss: 2.2989, Loss Parts: [2.2989]: 100%|███████████████████| 469/469 [00:08<00:00, 55.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3000, Loss Parts: [2.3000]: 100%|███████████████████| 469/469 [00:08<00:00, 54.47it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3059, Loss Parts: [2.3059]: 100%|███████████████████| 469/469 [00:08<00:00, 53.87it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.20it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:08<00:00, 54.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.56it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3030, Loss Parts: [2.3030]: 100%|███████████████████| 469/469 [00:08<00:00, 53.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1123
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.81it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1028
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:08<00:00, 54.53it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.59it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2975, Loss Parts: [2.2975]: 100%|███████████████████| 469/469 [00:08<00:00, 54.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3038, Loss Parts: [2.3038]: 100%|███████████████████| 469/469 [00:08<00:00, 53.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3008, Loss Parts: [2.3008]: 100%|███████████████████| 469/469 [00:07<00:00, 61.17it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.28it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3050, Loss Parts: [2.3050]: 100%|███████████████████| 469/469 [00:08<00:00, 54.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3022, Loss Parts: [2.3022]: 100%|███████████████████| 469/469 [00:08<00:00, 55.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2984, Loss Parts: [2.2984]: 100%|███████████████████| 469/469 [00:08<00:00, 54.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2936, Loss Parts: [2.2936]: 100%|███████████████████| 469/469 [00:08<00:00, 54.61it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.44it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:08<00:00, 54.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:08<00:00, 54.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2977, Loss Parts: [2.2977]: 100%|███████████████████| 469/469 [00:08<00:00, 53.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2994, Loss Parts: [2.2994]: 100%|███████████████████| 469/469 [00:08<00:00, 54.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:08<00:00, 53.85it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3089, Loss Parts: [2.3089]: 100%|███████████████████| 469/469 [00:07<00:00, 59.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3004, Loss Parts: [2.3004]: 100%|███████████████████| 469/469 [00:08<00:00, 53.60it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.25it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2981, Loss Parts: [2.2981]: 100%|███████████████████| 469/469 [00:08<00:00, 53.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3041, Loss Parts: [2.3041]: 100%|███████████████████| 469/469 [00:08<00:00, 53.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2988, Loss Parts: [2.2988]: 100%|███████████████████| 469/469 [00:08<00:00, 54.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3026, Loss Parts: [2.3026]: 100%|███████████████████| 469/469 [00:08<00:00, 55.98it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1123
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3011, Loss Parts: [2.3011]: 100%|███████████████████| 469/469 [00:08<00:00, 53.28it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.33it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2979, Loss Parts: [2.2979]: 100%|███████████████████| 469/469 [00:08<00:00, 55.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.50it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3015, Loss Parts: [2.3015]: 100%|███████████████████| 469/469 [00:08<00:00, 57.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2932, Loss Parts: [2.2932]: 100%|███████████████████| 469/469 [00:08<00:00, 54.67it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3049, Loss Parts: [2.3049]: 100%|███████████████████| 469/469 [00:07<00:00, 61.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.37it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3028, Loss Parts: [2.3028]: 100%|███████████████████| 469/469 [00:08<00:00, 54.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3038, Loss Parts: [2.3038]: 100%|███████████████████| 469/469 [00:08<00:00, 55.02it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1117
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:08<00:00, 55.07it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3006, Loss Parts: [2.3006]: 100%|███████████████████| 469/469 [00:08<00:00, 53.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3081, Loss Parts: [2.3081]: 100%|███████████████████| 469/469 [00:08<00:00, 56.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3072, Loss Parts: [2.3072]: 100%|███████████████████| 469/469 [00:08<00:00, 54.38it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1126
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.19it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1028
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3034, Loss Parts: [2.3034]: 100%|███████████████████| 469/469 [00:08<00:00, 55.97it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.77it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.2973, Loss Parts: [2.2973]: 100%|███████████████████| 469/469 [00:08<00:00, 55.79it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:08<00:00, 55.52it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.07it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3069, Loss Parts: [2.3069]: 100%|███████████████████| 469/469 [00:08<00:00, 58.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.97it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3010, Loss Parts: [2.3010]: 100%|███████████████████| 469/469 [00:08<00:00, 55.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1119
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3014, Loss Parts: [2.3014]: 100%|███████████████████| 469/469 [00:08<00:00, 55.22it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2997, Loss Parts: [2.2997]: 100%|███████████████████| 469/469 [00:08<00:00, 53.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3020, Loss Parts: [2.3020]: 100%|███████████████████| 469/469 [00:08<00:00, 55.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3016
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.2992, Loss Parts: [2.2992]: 100%|███████████████████| 469/469 [00:08<00:00, 55.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.27it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3039, Loss Parts: [2.3039]: 100%|███████████████████| 469/469 [00:08<00:00, 56.39it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3016, Total Loss: 2.3061, Loss Parts: [2.3061]: 100%|███████████████████| 469/469 [00:08<00:00, 53.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3016
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.05it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:08<00:00, 54.54it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.61it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3017
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3009, Loss Parts: [2.3009]: 100%|███████████████████| 469/469 [00:08<00:00, 54.08it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3008, Loss Parts: [2.3008]: 100%|███████████████████| 469/469 [00:07<00:00, 62.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3017, Total Loss: 2.3082, Loss Parts: [2.3082]: 100%|███████████████████| 469/469 [00:08<00:00, 54.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3017
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 10m 3s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\7a8c21cebbae6784\sessions\Session 05-19-2021 07-08-08 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.0, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'ear

Avg. Loss: 2.3018, Total Loss: 2.2974, Loss Parts: [2.2974]: 100%|███████████████████| 469/469 [00:08<00:00, 53.52it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3018
Training Accuracy: 0.1102
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.95it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3005, Loss Parts: [2.3005]: 100%|███████████████████| 469/469 [00:08<00:00, 53.69it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3014, Loss Parts: [2.3014]: 100%|███████████████████| 469/469 [00:08<00:00, 53.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3016, Loss Parts: [2.3016]: 100%|███████████████████| 469/469 [00:08<00:00, 55.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3013, Loss Parts: [2.3013]: 100%|███████████████████| 469/469 [00:08<00:00, 52.74it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2938, Loss Parts: [2.2938]: 100%|███████████████████| 469/469 [00:08<00:00, 53.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2972, Loss Parts: [2.2972]: 100%|███████████████████| 469/469 [00:08<00:00, 55.71it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3080, Loss Parts: [2.3080]: 100%|███████████████████| 469/469 [00:08<00:00, 55.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.34it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2975, Loss Parts: [2.2975]: 100%|███████████████████| 469/469 [00:06<00:00, 69.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.64it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3038, Loss Parts: [2.3038]: 100%|███████████████████| 469/469 [00:08<00:00, 53.84it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2953, Loss Parts: [2.2953]: 100%|███████████████████| 469/469 [00:08<00:00, 54.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.39it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.3001, Loss Parts: [2.3001]: 100%|███████████████████| 469/469 [00:08<00:00, 54.03it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3023, Loss Parts: [2.3023]: 100%|███████████████████| 469/469 [00:08<00:00, 52.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.96it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3069, Loss Parts: [2.3069]: 100%|███████████████████| 469/469 [00:08<00:00, 55.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2912, Loss Parts: [2.2912]: 100%|███████████████████| 469/469 [00:09<00:00, 51.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:08<00:00, 53.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3009, Loss Parts: [2.3009]: 100%|███████████████████| 469/469 [00:08<00:00, 54.35it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3069, Loss Parts: [2.3069]: 100%|███████████████████| 469/469 [00:08<00:00, 54.14it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.03it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3055, Loss Parts: [2.3055]: 100%|███████████████████| 469/469 [00:08<00:00, 56.33it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.78it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2955, Loss Parts: [2.2955]: 100%|███████████████████| 469/469 [00:08<00:00, 55.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.08it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2964, Loss Parts: [2.2964]: 100%|███████████████████| 469/469 [00:08<00:00, 54.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.2962, Loss Parts: [2.2962]: 100%|███████████████████| 469/469 [00:08<00:00, 56.29it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2985, Loss Parts: [2.2985]: 100%|███████████████████| 469/469 [00:08<00:00, 53.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3001, Loss Parts: [2.3001]: 100%|███████████████████| 469/469 [00:08<00:00, 56.12it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.40it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2987, Loss Parts: [2.2987]: 100%|███████████████████| 469/469 [00:08<00:00, 54.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1115
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.75it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2957, Loss Parts: [2.2957]: 100%|███████████████████| 469/469 [00:08<00:00, 55.21it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.2908, Loss Parts: [2.2908]: 100%|███████████████████| 469/469 [00:08<00:00, 56.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3036, Loss Parts: [2.3036]: 100%|███████████████████| 469/469 [00:08<00:00, 55.11it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.85it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3060, Loss Parts: [2.3060]: 100%|███████████████████| 469/469 [00:08<00:00, 55.89it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2843, Loss Parts: [2.2843]: 100%|███████████████████| 469/469 [00:08<00:00, 53.36it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2962, Loss Parts: [2.2962]: 100%|███████████████████| 469/469 [00:08<00:00, 53.55it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2991, Loss Parts: [2.2991]: 100%|███████████████████| 469/469 [00:08<00:00, 53.19it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.43it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3009
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2971, Loss Parts: [2.2971]: 100%|███████████████████| 469/469 [00:08<00:00, 53.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.52it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3070, Loss Parts: [2.3070]: 100%|███████████████████| 469/469 [00:08<00:00, 54.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.11it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3076, Loss Parts: [2.3076]: 100%|███████████████████| 469/469 [00:08<00:00, 52.96it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.04it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3048, Loss Parts: [2.3048]: 100%|███████████████████| 469/469 [00:08<00:00, 55.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.41it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3015, Total Loss: 2.3071, Loss Parts: [2.3071]: 100%|███████████████████| 469/469 [00:08<00:00, 55.05it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3015
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.92it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2957, Loss Parts: [2.2957]: 100%|███████████████████| 469/469 [00:08<00:00, 54.45it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.15it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3034, Loss Parts: [2.3034]: 100%|███████████████████| 469/469 [00:07<00:00, 61.83it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.25it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2996, Loss Parts: [2.2996]: 100%|███████████████████| 469/469 [00:07<00:00, 61.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3041, Loss Parts: [2.3041]: 100%|███████████████████| 469/469 [00:08<00:00, 56.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.55it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3015, Loss Parts: [2.3015]: 100%|███████████████████| 469/469 [00:08<00:00, 57.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.71it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3061, Loss Parts: [2.3061]: 100%|███████████████████| 469/469 [00:08<00:00, 57.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1118
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3060, Loss Parts: [2.3060]: 100%|███████████████████| 469/469 [00:07<00:00, 58.86it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2969, Loss Parts: [2.2969]: 100%|███████████████████| 469/469 [00:08<00:00, 52.91it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3059, Loss Parts: [2.3059]: 100%|███████████████████| 469/469 [00:08<00:00, 56.59it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.42it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3022, Loss Parts: [2.3022]: 100%|███████████████████| 469/469 [00:08<00:00, 54.51it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3009
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 48/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3033, Loss Parts: [2.3033]: 100%|███████████████████| 469/469 [00:08<00:00, 53.64it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 49/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2990, Loss Parts: [2.2990]: 100%|███████████████████| 469/469 [00:08<00:00, 55.66it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.17it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 50/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3005, Loss Parts: [2.3005]: 100%|███████████████████| 469/469 [00:08<00:00, 53.72it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.21it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

Training complete in 10m 3s
Saved session to C:\Users\Windows\Desktop\Shahir\18.408\18408-final-project\experiments\104efcad1f2821f2\sessions\Session 05-19-2021 07-18-10 PM
{'dataset_config': {'dataset_type': 'img', 'dataset_config': {'img_dataset_type': 'mnist', 'num_train_samples': 60000, 'num_test_samples': 10000, 'new_input_size': None, 'flatten': True, 'augment': False, 'corrupt_frac': 0.0, 'seed': 0}}, 'model_config': {'model_type': 'relu_toy', 'model_config': {'input_dim': 784, 'output_dim': 10, 'layer_dims': [100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100], 'bias': True, 'seed': None}}, 'training_config': {'optimizer_type': 'sgd_momentum', 'loss_type': 'cross_entropy', 'lr': 0.01, 'num_epochs': 50, 'clip_grad_norm': False, 'weight_decay': 0.01, 'use_lr_schedule': False, 'epoch_lr_decay_steps': None, 'lr_decay_gamma': None, 'early_stop': True, 'early_stop_acc': 0.9, 'ea

Avg. Loss: 2.3020, Total Loss: 2.3084, Loss Parts: [2.3084]: 100%|███████████████████| 469/469 [00:08<00:00, 53.34it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3020
Training Accuracy: 0.1097
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: -1.0000
Stagnation was: 0

----------
Epoch 2/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3150, Loss Parts: [2.3150]: 100%|███████████████████| 469/469 [00:08<00:00, 54.70it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.67it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 3/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3029, Loss Parts: [2.3029]: 100%|███████████████████| 469/469 [00:09<00:00, 51.43it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 4/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3062, Loss Parts: [2.3062]: 100%|███████████████████| 469/469 [00:08<00:00, 53.00it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.88it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 5/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2964, Loss Parts: [2.2964]: 100%|███████████████████| 469/469 [00:09<00:00, 51.32it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.51it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 6/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2914, Loss Parts: [2.2914]: 100%|███████████████████| 469/469 [00:08<00:00, 52.31it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.45it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 7/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2934, Loss Parts: [2.2934]: 100%|███████████████████| 469/469 [00:08<00:00, 52.65it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.99it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 8/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2987, Loss Parts: [2.2987]: 100%|███████████████████| 469/469 [00:08<00:00, 54.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.63it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 9/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3047, Loss Parts: [2.3047]: 100%|███████████████████| 469/469 [00:08<00:00, 52.68it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.62it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 10/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:08<00:00, 52.42it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.02it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 11/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2959, Loss Parts: [2.2959]: 100%|███████████████████| 469/469 [00:08<00:00, 52.82it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.90it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3015
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 12/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2998, Loss Parts: [2.2998]: 100%|███████████████████| 469/469 [00:08<00:00, 53.65it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 13/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2949, Loss Parts: [2.2949]: 100%|███████████████████| 469/469 [00:08<00:00, 53.82it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.24it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 14/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3024, Loss Parts: [2.3024]: 100%|███████████████████| 469/469 [00:08<00:00, 55.09it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.26it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 15/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2946, Loss Parts: [2.2946]: 100%|███████████████████| 469/469 [00:08<00:00, 53.49it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.18it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 16/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3049, Loss Parts: [2.3049]: 100%|███████████████████| 469/469 [00:08<00:00, 53.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 17/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3051, Loss Parts: [2.3051]: 100%|███████████████████| 469/469 [00:08<00:00, 52.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.74it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 18/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3067, Loss Parts: [2.3067]: 100%|███████████████████| 469/469 [00:08<00:00, 58.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.49it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 19/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3043, Loss Parts: [2.3043]: 100%|███████████████████| 469/469 [00:08<00:00, 52.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.60it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 20/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3006, Loss Parts: [2.3006]: 100%|███████████████████| 469/469 [00:08<00:00, 53.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.79it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 21/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2875, Loss Parts: [2.2875]: 100%|███████████████████| 469/469 [00:08<00:00, 53.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.09it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 22/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3062, Loss Parts: [2.3062]: 100%|███████████████████| 469/469 [00:08<00:00, 53.73it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1121
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.94it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1028
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 23/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3117, Loss Parts: [2.3117]: 100%|███████████████████| 469/469 [00:08<00:00, 56.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1120
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.38it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 24/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3014, Loss Parts: [2.3014]: 100%|███████████████████| 469/469 [00:08<00:00, 52.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.84it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 25/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3116, Loss Parts: [2.3116]: 100%|███████████████████| 469/469 [00:09<00:00, 50.93it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.70it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 26/50
----------
Training


Avg. Loss: 2.3013, Total Loss: 2.2967, Loss Parts: [2.2967]: 100%|███████████████████| 469/469 [00:08<00:00, 52.56it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3013
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 20.93it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 27/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3019, Loss Parts: [2.3019]: 100%|███████████████████| 469/469 [00:09<00:00, 51.16it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.14it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 28/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3048, Loss Parts: [2.3048]: 100%|███████████████████| 469/469 [00:08<00:00, 54.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.16it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 29/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2968, Loss Parts: [2.2968]: 100%|███████████████████| 469/469 [00:09<00:00, 50.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 24.36it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 30/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3048, Loss Parts: [2.3048]: 100%|███████████████████| 469/469 [00:09<00:00, 51.81it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 23.03it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 31/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2948, Loss Parts: [2.2948]: 100%|███████████████████| 469/469 [00:08<00:00, 52.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.69it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 32/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2991, Loss Parts: [2.2991]: 100%|███████████████████| 469/469 [00:09<00:00, 50.92it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 33/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3031, Loss Parts: [2.3031]: 100%|███████████████████| 469/469 [00:08<00:00, 52.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.12it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 34/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2955, Loss Parts: [2.2955]: 100%|███████████████████| 469/469 [00:08<00:00, 52.27it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.86it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 35/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3018, Loss Parts: [2.3018]: 100%|███████████████████| 469/469 [00:09<00:00, 51.68it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.58it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 36/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3029, Loss Parts: [2.3029]: 100%|███████████████████| 469/469 [00:08<00:00, 56.18it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 37/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3044, Loss Parts: [2.3044]: 100%|███████████████████| 469/469 [00:07<00:00, 58.77it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.29it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 38/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3068, Loss Parts: [2.3068]: 100%|███████████████████| 469/469 [00:09<00:00, 51.94it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.76it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 39/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3076, Loss Parts: [2.3076]: 100%|███████████████████| 469/469 [00:08<00:00, 54.13it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.10it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 40/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2964, Loss Parts: [2.2964]: 100%|███████████████████| 469/469 [00:09<00:00, 51.90it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.35it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 41/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3043, Loss Parts: [2.3043]: 100%|███████████████████| 469/469 [00:08<00:00, 52.80it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.47it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 42/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2995, Loss Parts: [2.2995]: 100%|███████████████████| 469/469 [00:08<00:00, 52.41it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.53it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3014
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 43/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3035, Loss Parts: [2.3035]: 100%|███████████████████| 469/469 [00:09<00:00, 51.40it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.13it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3012
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 44/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3073, Loss Parts: [2.3073]: 100%|███████████████████| 469/469 [00:08<00:00, 52.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.73it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3011
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 45/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.2978, Loss Parts: [2.2978]: 100%|███████████████████| 469/469 [00:09<00:00, 51.30it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 21.48it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3013
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 46/50
----------
Training


Avg. Loss: 2.3014, Total Loss: 2.3014, Loss Parts: [2.3014]: 100%|███████████████████| 469/469 [00:09<00:00, 51.48it/s]
  0%|                                                                                           | 0/79 [00:00<?, ?it/s]

Training Loss: 2.3014
Training Accuracy: 0.1124
Testing


100%|██████████████████████████████████████████████████████████████████████████████████| 79/79 [00:03<00:00, 22.31it/s]
  0%|                                                                                          | 0/469 [00:00<?, ?it/s]

Testing loss: 2.3010
Testing accuracy: 0.1135
Best testing accuracy was: 0.1135
Stagnation was: 0

----------
Epoch 47/50
----------
Training
