In [1]:
%cd ..

/home/ltorres/leo/tesis/cloud-classification/code


In [2]:
%load_ext autoreload
%autoreload 2

In [3]:
from torchvision.io import read_image
import glob
import os
import math


import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

from random import sample
import torch
import torch.nn as nn

In [4]:
from src.dataset import GCD
from src import config
from src import engine_gnn as engine
from src import utils
from src import sweeps

from src.models.graph_nets import GraphConvGNN, GATConvGNN

In [5]:
from sklearn.metrics import accuracy_score

In [6]:
import wandb

In [7]:
wandb.login()

[34m[1mwandb[0m: Currently logged in as: [33mleonardtd[0m (use `wandb login --relogin` to force relogin)


True

In [8]:
device = config.DEVICE

### Sweep config

In [9]:
# Sweep definition; hyper-parameter combinations are drawn with the 'random' method.
sweep_config = dict(method='random')

In [10]:
# Objective of the sweep: maximize the value that `train` logs under the
# 'test_accuracy' key.
metric = dict(name='test_accuracy', goal='maximize')

sweep_config.update(metric=metric)

In [28]:
# parameters_dict = {
#     'optimizer': {
#         'values': ['adam', 'sgd', 'nadam']
#         },
#     'criterion': {
#         'values': ['cross_entropy', 'loge']
#         },
#     'hidden_dim': {
#         'values': [128, 256, 512, 1024]
#         },
#     'num_hidden': {
#         'values': [2,3,4]
#         },
#     'num_heads': {
#           'values': [1,2,4]
#         },
#     'similarity_threshold': {
#           'values': [0.5, 0.6, 0.7, 0.75, 0.8, 0.9]
#         },
#     }

# sweep_config['parameters'] = parameters_dict

In [None]:
# Discrete search space: each hyper-parameter is picked from its list of candidates.
parameters_dict = {
    name: {'values': candidates}
    for name, candidates in (
        ('optimizer', ['sgd', 'nadam']),
        ('criterion', ['cross_entropy', 'loge']),
        ('hidden_dim', [512, 1024]),
        ('num_hidden', [2, 3, 4]),
        ('num_heads', [1, 4]),
        ('similarity_threshold', [0.65, 0.7, 0.75, 0.8]),
    )
}

# Attach the search space to the sweep definition. The same dict object is
# stored, so later in-place additions to `parameters_dict` remain visible
# through `sweep_config`.
sweep_config.update(parameters=parameters_dict)

In [12]:
# Settings that are held fixed for every run of the sweep (a single 'value'
# instead of a list of candidates).
parameters_dict.update({
    name: {'value': fixed}
    for name, fixed in (
        ('epochs', config.EPOCHS),
        ('device', device),
        ('classes', config.GCD_CLASSES),
    )
})

In [13]:
# Hyper-parameters sampled from continuous / quantized distributions.
parameters_dict.update({
    'learning_rate': {
        # a flat (uniform) distribution between 5e-6 and 3e-5
        'distribution': 'uniform',
        'min': 5e-6,
        'max': 3e-5,
    },
    'batch_size': {
        # integers (q = 1) between 16 and 36
        # with evenly-distributed logarithms;
        # 'q_log_uniform' takes its bounds in log space, hence math.log(...)
        'distribution': 'q_log_uniform',
        'q': 1,
        'min': math.log(16),
        'max': math.log(36),
    },
})

In [14]:
sweep_config

{'method': 'random',
 'metric': {'name': 'loss', 'goal': 'minimize'},
 'parameters': {'optimizer': {'values': ['adam', 'sgd', 'nadam']},
  'criterion': {'values': ['cross_entropy', 'loge']},
  'hidden_dim': {'values': [128, 256, 512, 1024]},
  'num_hidden': {'values': [2, 3, 4]},
  'num_heads': {'values': [1, 2, 4]},
  'similarity_threshold': {'values': [0.5, 0.6, 0.7, 0.75, 0.8, 0.9]},
  'epochs': {'value': 25},
  'device': {'value': 'cuda:2'},
  'learning_rate': {'distribution': 'uniform', 'min': 1e-06, 'max': 6e-05},
  'batch_size': {'distribution': 'q_log_uniform',
   'q': 1,
   'min': 2.772588722239781,
   'max': 3.4657359027997265}}}

In [15]:
# Register the sweep definition with W&B; the returned ID is what the agent is started with.
sweep_id = wandb.sweep(sweep=sweep_config, project="cloud classification")

Create sweep with ID: 03otgj81
Sweep URL: https://wandb.ai/leonardtd/cloud%20classification/sweeps/03otgj81


---

In [16]:
def train(config=None):
    """Run a single sweep trial: build data and model, train, evaluate, log to W&B.

    Meant to be passed to ``wandb.agent``. All hyper-parameters are read from
    ``wandb.config`` after the run has been initialised.

    Args:
        config: Optional configuration forwarded unchanged to ``wandb.init``.

    Returns:
        None. Per-epoch metrics and a final confusion matrix are sent to W&B,
        and a one-line summary per epoch is printed.
    """
    # Init new run
    with wandb.init(config=config):
        # Keep the run configuration under its own name instead of rebinding
        # the `config` argument.
        cfg = wandb.config

        # Cast defensively: the value comes from a quantized sweep distribution
        # and may arrive as a float. NOTE(review): presumably forwarded to a
        # DataLoader, which needs an int — confirm in utils.build_dataset_gcd.
        batch_size = int(cfg.batch_size)
        train_loader, test_loader, augmentation_loaders = utils.build_dataset_gcd(batch_size)

        model = utils.build_model_gatconv(
            7,  # GCD num classes
            cfg.hidden_dim,
            cfg.num_hidden,
            cfg.num_heads,
            cfg.similarity_threshold,
            cfg.device,
        )

        optimizer = utils.build_optimizer(cfg.optimizer, model, cfg.learning_rate)
        criterion = utils.build_criterion(cfg.criterion)

        # Remain None when no epoch runs, so the confusion matrix can be skipped
        # instead of failing on unbound names.
        test_preds = test_targets = None

        for e in range(cfg.epochs):
            ### TRAIN DATASET
            preds, targets, loss = engine.train_fn(model,
                                                   train_loader,
                                                   criterion,
                                                   optimizer,
                                                   cfg.device)
            train_acc = accuracy_score(targets, preds)

            ### AUGMENTATION IMAGES
            # One extra optimisation pass per augmentation loader; nothing is
            # collected from these passes.
            for _loader in augmentation_loaders:
                engine.forward_backward_pass(model,
                                             _loader,
                                             criterion,
                                             optimizer,
                                             device=cfg.device)

            ### TEST DATASET
            test_preds, test_targets, test_loss = engine.eval_fn(model,
                                                                 test_loader,
                                                                 criterion,
                                                                 device=cfg.device)
            test_acc = accuracy_score(test_targets, test_preds)

            print("EPOCH {}: Train acc: {:.2%} Train Loss: {:.4f} Test acc: {:.2%} Test Loss: {:.4f}".format(
                e+1,
                train_acc,
                loss,
                test_acc,
                test_loss
            ))

            # Log everything for this epoch in ONE call so all values share the
            # same history step (each wandb.log call advances the step).
            wandb.log({
                "train/train_loss": loss,
                "train/train_accuracy": train_acc,
                "test/test_loss": test_loss,
                "test/test_accuracy": test_acc,
                # un-prefixed copy: this is the metric name the sweep optimizes
                "test_accuracy": test_acc,
                "epoch": e+1,
            })

        # Confusion matrix of the last epoch's test predictions.
        if test_preds is not None:
            wandb.log({"conf_mat": wandb.plot.confusion_matrix(probs=None,
                                                               preds=test_preds,
                                                               y_true=test_targets,
                                                               class_names=cfg.classes)})

---

In [17]:
# Start an agent for the sweep and let it execute `train` for 10 runs.
wandb.agent(sweep_id, function=train, count=10)

[34m[1mwandb[0m: Agent Starting Run: dhty9zi0 with config:
[34m[1mwandb[0m: 	batch_size: 23
[34m[1mwandb[0m: 	criterion: loge
[34m[1mwandb[0m: 	device: cuda:2
[34m[1mwandb[0m: 	epochs: 25
[34m[1mwandb[0m: 	hidden_dim: 1024
[34m[1mwandb[0m: 	learning_rate: 5.101083500805064e-06
[34m[1mwandb[0m: 	num_heads: 1
[34m[1mwandb[0m: 	num_hidden: 4
[34m[1mwandb[0m: 	optimizer: sgd
[34m[1mwandb[0m: 	similarity_threshold: 0.75


100%|██████████| 435/435 [01:00<00:00,  7.16it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.40it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 392/392 [00:19<00:00, 19.98it/s]


EPOCH 1: Train acc: 37.91% Train Loss: 3.6822 Test acc: 53.23% Test Loss: 2.7823


100%|██████████| 435/435 [01:01<00:00,  7.13it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 392/392 [00:19<00:00, 20.31it/s]


EPOCH 2: Train acc: 64.59% Train Loss: 2.4977 Test acc: 63.86% Test Loss: 2.3849


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 392/392 [00:19<00:00, 19.95it/s]


EPOCH 3: Train acc: 73.43% Train Loss: 2.0289 Test acc: 71.06% Test Loss: 2.0831


100%|██████████| 435/435 [01:00<00:00,  7.16it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 20.05it/s]


EPOCH 4: Train acc: 78.05% Train Loss: 1.7197 Test acc: 72.06% Test Loss: 1.9424


100%|██████████| 435/435 [01:00<00:00,  7.20it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.47it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 392/392 [00:19<00:00, 19.87it/s]


EPOCH 5: Train acc: 79.83% Train Loss: 1.5187 Test acc: 74.50% Test Loss: 1.7611


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 392/392 [00:19<00:00, 19.96it/s]


EPOCH 6: Train acc: 81.53% Train Loss: 1.3626 Test acc: 73.36% Test Loss: 1.7580


100%|██████████| 435/435 [01:00<00:00,  7.17it/s]
100%|██████████| 435/435 [00:58<00:00,  7.39it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 392/392 [00:19<00:00, 19.91it/s]


EPOCH 7: Train acc: 83.45% Train Loss: 1.1998 Test acc: 76.12% Test Loss: 1.5644


100%|██████████| 435/435 [01:00<00:00,  7.20it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.40it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 19.89it/s]


EPOCH 8: Train acc: 83.60% Train Loss: 1.1124 Test acc: 76.27% Test Loss: 1.5387


100%|██████████| 435/435 [01:00<00:00,  7.17it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 19.95it/s]


EPOCH 9: Train acc: 84.08% Train Loss: 1.0391 Test acc: 74.16% Test Loss: 1.6158


100%|██████████| 435/435 [01:00<00:00,  7.16it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 392/392 [00:19<00:00, 19.90it/s]


EPOCH 10: Train acc: 84.84% Train Loss: 0.9780 Test acc: 76.21% Test Loss: 1.5179


100%|██████████| 435/435 [01:00<00:00,  7.14it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 392/392 [00:19<00:00, 20.01it/s]


EPOCH 11: Train acc: 84.88% Train Loss: 0.9458 Test acc: 76.39% Test Loss: 1.4928


100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.47it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 392/392 [00:19<00:00, 20.01it/s]


EPOCH 12: Train acc: 86.03% Train Loss: 0.9045 Test acc: 77.41% Test Loss: 1.4408


100%|██████████| 435/435 [01:00<00:00,  7.17it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.38it/s]
100%|██████████| 392/392 [00:19<00:00, 19.96it/s]


EPOCH 13: Train acc: 86.40% Train Loss: 0.8652 Test acc: 79.33% Test Loss: 1.3565


100%|██████████| 435/435 [01:00<00:00,  7.16it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 19.98it/s]


EPOCH 14: Train acc: 86.69% Train Loss: 0.8511 Test acc: 79.13% Test Loss: 1.3550


100%|██████████| 435/435 [01:00<00:00,  7.14it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 392/392 [00:19<00:00, 20.04it/s]


EPOCH 15: Train acc: 86.87% Train Loss: 0.8338 Test acc: 77.26% Test Loss: 1.4446


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.47it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 392/392 [00:19<00:00, 20.00it/s]


EPOCH 16: Train acc: 86.89% Train Loss: 0.8183 Test acc: 78.73% Test Loss: 1.3744


100%|██████████| 435/435 [01:00<00:00,  7.16it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 435/435 [00:58<00:00,  7.41it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.39it/s]
100%|██████████| 392/392 [00:19<00:00, 20.09it/s]


EPOCH 17: Train acc: 87.05% Train Loss: 0.8035 Test acc: 78.21% Test Loss: 1.3898


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.48it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 20.13it/s]


EPOCH 18: Train acc: 87.85% Train Loss: 0.7791 Test acc: 77.64% Test Loss: 1.4148


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 435/435 [00:58<00:00,  7.48it/s]
100%|██████████| 392/392 [00:19<00:00, 20.20it/s]


EPOCH 19: Train acc: 87.97% Train Loss: 0.7686 Test acc: 77.72% Test Loss: 1.3865


100%|██████████| 435/435 [01:00<00:00,  7.17it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 392/392 [00:19<00:00, 20.10it/s]


EPOCH 20: Train acc: 87.72% Train Loss: 0.7708 Test acc: 78.64% Test Loss: 1.3519


100%|██████████| 435/435 [01:00<00:00,  7.19it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 392/392 [00:19<00:00, 20.31it/s]


EPOCH 21: Train acc: 88.13% Train Loss: 0.7467 Test acc: 78.39% Test Loss: 1.3748


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.43it/s]
100%|██████████| 435/435 [00:58<00:00,  7.47it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 20.12it/s]


EPOCH 22: Train acc: 88.81% Train Loss: 0.7273 Test acc: 79.40% Test Loss: 1.3395


100%|██████████| 435/435 [01:00<00:00,  7.18it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.40it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 20.16it/s]


EPOCH 23: Train acc: 88.76% Train Loss: 0.7173 Test acc: 79.98% Test Loss: 1.3218


100%|██████████| 435/435 [01:00<00:00,  7.19it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.44it/s]
100%|██████████| 392/392 [00:19<00:00, 20.08it/s]


EPOCH 24: Train acc: 88.44% Train Loss: 0.7205 Test acc: 79.08% Test Loss: 1.3553


100%|██████████| 435/435 [01:00<00:00,  7.15it/s]
100%|██████████| 435/435 [00:58<00:00,  7.45it/s]
100%|██████████| 435/435 [00:58<00:00,  7.39it/s]
100%|██████████| 435/435 [00:58<00:00,  7.46it/s]
100%|██████████| 435/435 [00:58<00:00,  7.42it/s]
100%|██████████| 392/392 [00:19<00:00, 20.15it/s]


EPOCH 25: Train acc: 89.09% Train Loss: 0.6995 Test acc: 80.01% Test Loss: 1.3104



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,█▆▅▄▃▃▂▂▂▂▂▂▁▁▂▁▁▁▁▁▁▁▁▁▁
test/test_accuracy,▁▄▆▆▇▆▇▇▆▇▇▇██▇██▇▇██████
test/test_loss,█▆▅▄▃▃▂▂▂▂▂▂▁▁▂▁▁▁▁▁▁▁▁▁▁
train/train_accuracy,▁▅▆▆▇▇▇▇▇▇▇██████████████
train/train_loss,█▅▄▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,25.0
loss,1.31042
test/test_accuracy,0.80011
test/test_loss,1.31042
train/train_accuracy,0.8909
train/train_loss,0.69946


Run dhty9zi0 errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: [32m[41mERROR[0m Run dhty9zi0 errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: Agent Starting Run: rlw5rywq with config:
[34m[1mwandb[0m: 	batch_size: 23
[34m[1mwandb[0m: 	criterion: loge
[34m[1mwandb[0m: 	device: cuda:2
[34m[1mwandb[0m: 	epochs: 25
[34m[1mwandb[0m: 	hidden_dim: 1024
[34m[1mwandb[0m: 	learning_rate: 2.481169315141051e-05
[34m[1mwandb[0m: 	num_heads: 4
[34m[1mwandb[0m: 	num_hidden: 3
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	similarity_threshold: 0.5


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.37it/s]


EPOCH 1: Train acc: 78.28% Train Loss: 1.2762 Test acc: 82.41% Test Loss: 1.2296


100%|██████████| 435/435 [01:03<00:00,  6.88it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.45it/s]


EPOCH 2: Train acc: 92.37% Train Loss: 0.4532 Test acc: 81.33% Test Loss: 1.2545


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.47it/s]


EPOCH 3: Train acc: 95.06% Train Loss: 0.2955 Test acc: 80.83% Test Loss: 1.2918


100%|██████████| 435/435 [01:02<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.12it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.36it/s]


EPOCH 4: Train acc: 97.20% Train Loss: 0.1799 Test acc: 78.66% Test Loss: 1.4436


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.12it/s]
100%|██████████| 392/392 [00:19<00:00, 20.32it/s]


EPOCH 5: Train acc: 98.36% Train Loss: 0.1125 Test acc: 78.23% Test Loss: 1.4872


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.45it/s]


EPOCH 6: Train acc: 98.69% Train Loss: 0.0887 Test acc: 79.81% Test Loss: 1.4036


100%|██████████| 435/435 [01:03<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 392/392 [00:18<00:00, 20.64it/s]


EPOCH 7: Train acc: 98.98% Train Loss: 0.0707 Test acc: 80.53% Test Loss: 1.3687


100%|██████████| 435/435 [01:03<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.13it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.49it/s]


EPOCH 8: Train acc: 99.01% Train Loss: 0.0629 Test acc: 80.58% Test Loss: 1.3534


100%|██████████| 435/435 [01:03<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.12it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.53it/s]


EPOCH 9: Train acc: 99.46% Train Loss: 0.0378 Test acc: 80.54% Test Loss: 1.3433


100%|██████████| 435/435 [01:03<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 392/392 [00:19<00:00, 20.46it/s]


EPOCH 10: Train acc: 99.50% Train Loss: 0.0357 Test acc: 78.49% Test Loss: 1.5128


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.54it/s]


EPOCH 11: Train acc: 99.55% Train Loss: 0.0333 Test acc: 80.72% Test Loss: 1.3678


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.45it/s]


EPOCH 12: Train acc: 99.60% Train Loss: 0.0279 Test acc: 79.98% Test Loss: 1.4048


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.47it/s]


EPOCH 13: Train acc: 99.55% Train Loss: 0.0283 Test acc: 79.07% Test Loss: 1.4698


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 392/392 [00:19<00:00, 20.38it/s]


EPOCH 14: Train acc: 99.73% Train Loss: 0.0228 Test acc: 80.31% Test Loss: 1.3770


100%|██████████| 435/435 [01:02<00:00,  6.92it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:00<00:00,  7.13it/s]
100%|██████████| 392/392 [00:19<00:00, 20.38it/s]


EPOCH 15: Train acc: 99.76% Train Loss: 0.0207 Test acc: 78.23% Test Loss: 1.5406


100%|██████████| 435/435 [01:03<00:00,  6.89it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.38it/s]


EPOCH 16: Train acc: 99.64% Train Loss: 0.0247 Test acc: 78.99% Test Loss: 1.5116


100%|██████████| 435/435 [01:03<00:00,  6.89it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.42it/s]


EPOCH 17: Train acc: 99.80% Train Loss: 0.0142 Test acc: 78.79% Test Loss: 1.4874


100%|██████████| 435/435 [01:03<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.06it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 392/392 [00:19<00:00, 20.37it/s]


EPOCH 18: Train acc: 99.78% Train Loss: 0.0167 Test acc: 79.87% Test Loss: 1.4357


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.06it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.45it/s]


EPOCH 19: Train acc: 99.78% Train Loss: 0.0171 Test acc: 79.71% Test Loss: 1.4136


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.53it/s]


EPOCH 20: Train acc: 99.90% Train Loss: 0.0101 Test acc: 79.44% Test Loss: 1.4653


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.50it/s]


EPOCH 21: Train acc: 99.80% Train Loss: 0.0146 Test acc: 78.10% Test Loss: 1.5866


100%|██████████| 435/435 [01:02<00:00,  6.95it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.11it/s]
100%|██████████| 392/392 [00:19<00:00, 20.39it/s]


EPOCH 22: Train acc: 99.85% Train Loss: 0.0123 Test acc: 79.42% Test Loss: 1.5309


100%|██████████| 435/435 [01:03<00:00,  6.90it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.13it/s]
100%|██████████| 392/392 [00:19<00:00, 20.37it/s]


EPOCH 23: Train acc: 99.74% Train Loss: 0.0158 Test acc: 78.09% Test Loss: 1.5543


100%|██████████| 435/435 [01:02<00:00,  6.91it/s]
100%|██████████| 435/435 [01:01<00:00,  7.07it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 392/392 [00:19<00:00, 20.38it/s]


EPOCH 24: Train acc: 99.78% Train Loss: 0.0161 Test acc: 78.18% Test Loss: 1.5583


100%|██████████| 435/435 [01:02<00:00,  6.92it/s]
100%|██████████| 435/435 [01:01<00:00,  7.08it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 435/435 [01:01<00:00,  7.10it/s]
100%|██████████| 435/435 [01:01<00:00,  7.09it/s]
100%|██████████| 392/392 [00:19<00:00, 20.37it/s]


EPOCH 25: Train acc: 99.81% Train Loss: 0.0145 Test acc: 77.63% Test Loss: 1.5639



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,▁▁▂▅▆▄▄▃▃▇▄▄▆▄▇▇▆▅▅▆█▇▇▇█
test/test_accuracy,█▆▆▂▂▄▅▅▅▂▆▄▃▅▂▃▃▄▄▄▂▄▂▂▁
test/test_loss,▁▁▂▅▆▄▄▃▃▇▄▄▆▄▇▇▆▅▅▆█▇▇▇█
train/train_accuracy,▁▆▆▇█████████████████████
train/train_loss,█▃▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,25.0
loss,1.56386
test/test_accuracy,0.77633
test/test_loss,1.56386
train/train_accuracy,0.9981
train/train_loss,0.01448


Run rlw5rywq errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: [32m[41mERROR[0m Run rlw5rywq errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: Agent Starting Run: z0o4ky74 with config:
[34m[1mwandb[0m: 	batch_size: 16
[34m[1mwandb[0m: 	criterion: loge
[34m[1mwandb[0m: 	device: cuda:2
[34m[1mwandb[0m: 	epochs: 25
[34m[1mwandb[0m: 	hidden_dim: 256
[34m[1mwandb[0m: 	learning_rate: 2.0041349912259276e-05
[34m[1mwandb[0m: 	num_heads: 2
[34m[1mwandb[0m: 	num_hidden: 2
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	similarity_threshold: 0.75


100%|██████████| 625/625 [01:02<00:00, 10.04it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.27it/s]


EPOCH 1: Train acc: 78.87% Train Loss: 1.2966 Test acc: 81.08% Test Loss: 1.2273


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.25it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 563/563 [00:19<00:00, 29.20it/s]


EPOCH 2: Train acc: 92.00% Train Loss: 0.4814 Test acc: 79.90% Test Loss: 1.2947


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.24it/s]


EPOCH 3: Train acc: 94.86% Train Loss: 0.3189 Test acc: 78.67% Test Loss: 1.4093


100%|██████████| 625/625 [01:02<00:00,  9.97it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.15it/s]


EPOCH 4: Train acc: 96.80% Train Loss: 0.1957 Test acc: 79.07% Test Loss: 1.3970


100%|██████████| 625/625 [01:02<00:00,  9.93it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 563/563 [00:19<00:00, 29.13it/s]


EPOCH 5: Train acc: 98.14% Train Loss: 0.1228 Test acc: 78.50% Test Loss: 1.4231


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 563/563 [00:19<00:00, 29.34it/s]


EPOCH 6: Train acc: 98.62% Train Loss: 0.0989 Test acc: 77.93% Test Loss: 1.4496


100%|██████████| 625/625 [01:02<00:00,  9.97it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 563/563 [00:19<00:00, 28.91it/s]


EPOCH 7: Train acc: 98.73% Train Loss: 0.0803 Test acc: 78.16% Test Loss: 1.4458


100%|██████████| 625/625 [01:02<00:00,  9.96it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:00<00:00, 10.28it/s]
100%|██████████| 563/563 [00:19<00:00, 29.07it/s]


EPOCH 8: Train acc: 99.18% Train Loss: 0.0585 Test acc: 75.77% Test Loss: 1.5683


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.31it/s]


EPOCH 9: Train acc: 99.42% Train Loss: 0.0423 Test acc: 76.77% Test Loss: 1.5249


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.14it/s]


EPOCH 10: Train acc: 99.44% Train Loss: 0.0379 Test acc: 76.88% Test Loss: 1.5482


100%|██████████| 625/625 [01:02<00:00,  9.93it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 563/563 [00:19<00:00, 29.21it/s]


EPOCH 11: Train acc: 99.60% Train Loss: 0.0289 Test acc: 77.79% Test Loss: 1.5097


100%|██████████| 625/625 [01:02<00:00,  9.96it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 563/563 [00:19<00:00, 29.26it/s]


EPOCH 12: Train acc: 99.71% Train Loss: 0.0238 Test acc: 77.86% Test Loss: 1.4641


100%|██████████| 625/625 [01:02<00:00,  9.97it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 563/563 [00:19<00:00, 29.26it/s]


EPOCH 13: Train acc: 99.62% Train Loss: 0.0252 Test acc: 78.79% Test Loss: 1.4317


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.12it/s]


EPOCH 14: Train acc: 99.78% Train Loss: 0.0164 Test acc: 77.42% Test Loss: 1.5439


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.17it/s]


EPOCH 15: Train acc: 99.69% Train Loss: 0.0243 Test acc: 78.16% Test Loss: 1.4511


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 563/563 [00:19<00:00, 29.03it/s]


EPOCH 16: Train acc: 99.73% Train Loss: 0.0194 Test acc: 77.26% Test Loss: 1.5369


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.31it/s]
100%|██████████| 563/563 [00:19<00:00, 29.46it/s]


EPOCH 17: Train acc: 99.69% Train Loss: 0.0208 Test acc: 77.97% Test Loss: 1.5091


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 563/563 [00:19<00:00, 29.30it/s]


EPOCH 18: Train acc: 99.83% Train Loss: 0.0141 Test acc: 76.70% Test Loss: 1.5929


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 563/563 [00:19<00:00, 29.16it/s]


EPOCH 19: Train acc: 99.80% Train Loss: 0.0140 Test acc: 77.00% Test Loss: 1.5745


100%|██████████| 625/625 [01:02<00:00,  9.95it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 563/563 [00:19<00:00, 29.26it/s]


EPOCH 20: Train acc: 99.75% Train Loss: 0.0183 Test acc: 75.21% Test Loss: 1.6910


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.21it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 563/563 [00:19<00:00, 29.28it/s]


EPOCH 21: Train acc: 99.73% Train Loss: 0.0180 Test acc: 77.58% Test Loss: 1.5783


100%|██████████| 625/625 [01:02<00:00,  9.94it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.26it/s]
100%|██████████| 563/563 [00:19<00:00, 29.18it/s]


EPOCH 22: Train acc: 99.86% Train Loss: 0.0114 Test acc: 77.23% Test Loss: 1.5531


100%|██████████| 625/625 [01:02<00:00,  9.98it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:01<00:00, 10.24it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 563/563 [00:19<00:00, 29.21it/s]


EPOCH 23: Train acc: 99.84% Train Loss: 0.0136 Test acc: 77.17% Test Loss: 1.5611


100%|██████████| 625/625 [01:02<00:00,  9.97it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:00<00:00, 10.25it/s]
100%|██████████| 563/563 [00:19<00:00, 29.20it/s]


EPOCH 24: Train acc: 99.82% Train Loss: 0.0132 Test acc: 77.83% Test Loss: 1.5170


100%|██████████| 625/625 [01:02<00:00,  9.96it/s]
100%|██████████| 625/625 [01:01<00:00, 10.23it/s]
100%|██████████| 625/625 [01:01<00:00, 10.22it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 625/625 [01:00<00:00, 10.27it/s]
100%|██████████| 563/563 [00:19<00:00, 29.24it/s]

EPOCH 25: Train acc: 99.87% Train Loss: 0.0115 Test acc: 76.04% Test Loss: 1.6531






VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,▁▂▄▄▄▄▄▆▅▆▅▅▄▆▄▆▅▇▆█▆▆▆▅▇
test/test_accuracy,█▇▅▆▅▄▅▂▃▃▄▄▅▄▅▃▄▃▃▁▄▃▃▄▂
test/test_loss,▁▂▄▄▄▄▄▆▅▆▅▅▄▆▄▆▅▇▆█▆▆▆▅▇
train/train_accuracy,▁▅▆▇▇████████████████████
train/train_loss,█▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,25.0
loss,1.65308
test/test_accuracy,0.76044
test/test_loss,1.65308
train/train_accuracy,0.9987
train/train_loss,0.01155


Run z0o4ky74 errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: [32m[41mERROR[0m Run z0o4ky74 errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: Agent Starting Run: w2nqk3lb with config:
[34m[1mwandb[0m: 	batch_size: 25
[34m[1mwandb[0m: 	criterion: loge
[34m[1mwandb[0m: 	device: cuda:2
[34m[1mwandb[0m: 	epochs: 25
[34m[1mwandb[0m: 	hidden_dim: 512
[34m[1mwandb[0m: 	learning_rate: 3.0236125085020263e-05
[34m[1mwandb[0m: 	num_heads: 1
[34m[1mwandb[0m: 	num_hidden: 3
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	similarity_threshold: 0.9


100%|██████████| 400/400 [01:01<00:00,  6.54it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:19<00:00, 18.79it/s]


EPOCH 1: Train acc: 81.17% Train Loss: 1.1853 Test acc: 76.78% Test Loss: 1.3519


100%|██████████| 400/400 [01:01<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.65it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:19<00:00, 18.82it/s]


EPOCH 2: Train acc: 92.38% Train Loss: 0.4439 Test acc: 75.10% Test Loss: 1.5402


100%|██████████| 400/400 [01:00<00:00,  6.59it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:19<00:00, 18.90it/s]


EPOCH 3: Train acc: 95.28% Train Loss: 0.2814 Test acc: 74.41% Test Loss: 1.6283


100%|██████████| 400/400 [01:00<00:00,  6.57it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 360/360 [00:18<00:00, 18.97it/s]


EPOCH 4: Train acc: 96.86% Train Loss: 0.1896 Test acc: 76.04% Test Loss: 1.4780


100%|██████████| 400/400 [01:00<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:19<00:00, 18.84it/s]


EPOCH 5: Train acc: 97.96% Train Loss: 0.1266 Test acc: 75.83% Test Loss: 1.5312


100%|██████████| 400/400 [01:01<00:00,  6.56it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:19<00:00, 18.84it/s]


EPOCH 6: Train acc: 98.50% Train Loss: 0.0960 Test acc: 77.50% Test Loss: 1.4254


100%|██████████| 400/400 [01:00<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:19<00:00, 18.95it/s]


EPOCH 7: Train acc: 98.78% Train Loss: 0.0755 Test acc: 75.34% Test Loss: 1.6533


100%|██████████| 400/400 [01:01<00:00,  6.55it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 360/360 [00:18<00:00, 19.02it/s]


EPOCH 8: Train acc: 98.96% Train Loss: 0.0665 Test acc: 75.57% Test Loss: 1.5272


100%|██████████| 400/400 [01:01<00:00,  6.55it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 360/360 [00:18<00:00, 19.16it/s]


EPOCH 9: Train acc: 99.23% Train Loss: 0.0474 Test acc: 77.06% Test Loss: 1.4782


100%|██████████| 400/400 [01:00<00:00,  6.57it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:19<00:00, 18.95it/s]


EPOCH 10: Train acc: 99.20% Train Loss: 0.0458 Test acc: 74.87% Test Loss: 1.6370


100%|██████████| 400/400 [01:00<00:00,  6.57it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:19<00:00, 18.88it/s]


EPOCH 11: Train acc: 99.45% Train Loss: 0.0370 Test acc: 75.11% Test Loss: 1.6557


100%|██████████| 400/400 [01:00<00:00,  6.58it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:18<00:00, 18.98it/s]


EPOCH 12: Train acc: 99.35% Train Loss: 0.0396 Test acc: 74.90% Test Loss: 1.6305


100%|██████████| 400/400 [01:01<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 360/360 [00:18<00:00, 19.01it/s]


EPOCH 13: Train acc: 99.42% Train Loss: 0.0361 Test acc: 73.71% Test Loss: 1.7292


100%|██████████| 400/400 [01:01<00:00,  6.55it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:19<00:00, 18.84it/s]


EPOCH 14: Train acc: 99.54% Train Loss: 0.0295 Test acc: 76.30% Test Loss: 1.5264


100%|██████████| 400/400 [01:00<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:18<00:00, 19.23it/s]


EPOCH 15: Train acc: 99.58% Train Loss: 0.0295 Test acc: 75.32% Test Loss: 1.5841


100%|██████████| 400/400 [01:01<00:00,  6.53it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [01:00<00:00,  6.65it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:18<00:00, 18.97it/s]


EPOCH 16: Train acc: 99.61% Train Loss: 0.0259 Test acc: 76.83% Test Loss: 1.4971


100%|██████████| 400/400 [01:00<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:18<00:00, 19.11it/s]


EPOCH 17: Train acc: 99.73% Train Loss: 0.0189 Test acc: 74.90% Test Loss: 1.6580


100%|██████████| 400/400 [01:00<00:00,  6.57it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 360/360 [00:18<00:00, 18.97it/s]


EPOCH 18: Train acc: 99.64% Train Loss: 0.0231 Test acc: 74.19% Test Loss: 1.7130


100%|██████████| 400/400 [01:00<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:19<00:00, 18.87it/s]


EPOCH 19: Train acc: 99.72% Train Loss: 0.0186 Test acc: 74.44% Test Loss: 1.6624


100%|██████████| 400/400 [01:01<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 360/360 [00:19<00:00, 18.87it/s]


EPOCH 20: Train acc: 99.73% Train Loss: 0.0180 Test acc: 74.94% Test Loss: 1.7104


100%|██████████| 400/400 [01:01<00:00,  6.54it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.65it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 360/360 [00:18<00:00, 19.02it/s]


EPOCH 21: Train acc: 99.72% Train Loss: 0.0169 Test acc: 75.19% Test Loss: 1.6417


100%|██████████| 400/400 [01:00<00:00,  6.57it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.68it/s]
100%|██████████| 400/400 [00:59<00:00,  6.70it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:18<00:00, 19.13it/s]


EPOCH 22: Train acc: 99.65% Train Loss: 0.0226 Test acc: 77.01% Test Loss: 1.4905


100%|██████████| 400/400 [01:01<00:00,  6.56it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:18<00:00, 19.00it/s]


EPOCH 23: Train acc: 99.80% Train Loss: 0.0139 Test acc: 75.94% Test Loss: 1.5614


100%|██████████| 400/400 [01:00<00:00,  6.57it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [01:00<00:00,  6.66it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 360/360 [00:19<00:00, 18.94it/s]


EPOCH 24: Train acc: 99.81% Train Loss: 0.0148 Test acc: 75.33% Test Loss: 1.6492


100%|██████████| 400/400 [01:00<00:00,  6.56it/s]
100%|██████████| 400/400 [00:59<00:00,  6.67it/s]
100%|██████████| 400/400 [01:00<00:00,  6.67it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 400/400 [00:59<00:00,  6.69it/s]
100%|██████████| 360/360 [00:19<00:00, 18.87it/s]


EPOCH 25: Train acc: 99.77% Train Loss: 0.0164 Test acc: 75.12% Test Loss: 1.7154



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,▁▄▆▃▄▂▇▄▃▆▇▆█▄▅▄▇█▇█▆▄▅▇█
test/test_accuracy,▇▄▂▅▅█▄▄▇▃▄▃▁▆▄▇▃▂▂▃▄▇▅▄▄
test/test_loss,▁▄▆▃▄▂▇▄▃▆▇▆█▄▅▄▇█▇█▆▄▅▇█
train/train_accuracy,▁▅▆▇▇████████████████████
train/train_loss,█▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,25.0
loss,1.71544
test/test_accuracy,0.75122
test/test_loss,1.71544
train/train_accuracy,0.9977
train/train_loss,0.01636


Run w2nqk3lb errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: [32m[41mERROR[0m Run w2nqk3lb errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: Agent Starting Run: 925yo3hw with config:
[34m[1mwandb[0m: 	batch_size: 26
[34m[1mwandb[0m: 	criterion: loge
[34m[1mwandb[0m: 	device: cuda:2
[34m[1mwandb[0m: 	epochs: 25
[34m[1mwandb[0m: 	hidden_dim: 512
[34m[1mwandb[0m: 	learning_rate: 4.594822028254274e-05
[34m[1mwandb[0m: 	num_heads: 1
[34m[1mwandb[0m: 	num_hidden: 2
[34m[1mwandb[0m: 	optimizer: adam
[34m[1mwandb[0m: 	similarity_threshold: 0.6


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.48it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.69it/s]


EPOCH 1: Train acc: 79.91% Train Loss: 1.1681 Test acc: 80.03% Test Loss: 1.3581


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.62it/s]


EPOCH 2: Train acc: 92.35% Train Loss: 0.4575 Test acc: 80.68% Test Loss: 1.2960


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.70it/s]


EPOCH 3: Train acc: 94.63% Train Loss: 0.3220 Test acc: 81.92% Test Loss: 1.2492


100%|██████████| 385/385 [01:00<00:00,  6.34it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 347/347 [00:18<00:00, 18.64it/s]


EPOCH 4: Train acc: 96.63% Train Loss: 0.2051 Test acc: 79.20% Test Loss: 1.3797


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.48it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.61it/s]


EPOCH 5: Train acc: 97.70% Train Loss: 0.1441 Test acc: 79.04% Test Loss: 1.4539


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.53it/s]


EPOCH 6: Train acc: 98.51% Train Loss: 0.0982 Test acc: 78.49% Test Loss: 1.4673


100%|██████████| 385/385 [01:00<00:00,  6.37it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.71it/s]


EPOCH 7: Train acc: 98.93% Train Loss: 0.0732 Test acc: 76.81% Test Loss: 1.6168


100%|██████████| 385/385 [01:00<00:00,  6.38it/s]
100%|██████████| 385/385 [00:59<00:00,  6.52it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.75it/s]


EPOCH 8: Train acc: 99.10% Train Loss: 0.0614 Test acc: 78.22% Test Loss: 1.5107


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.52it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.69it/s]


EPOCH 9: Train acc: 99.10% Train Loss: 0.0629 Test acc: 77.03% Test Loss: 1.5924


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.65it/s]


EPOCH 10: Train acc: 99.25% Train Loss: 0.0487 Test acc: 78.04% Test Loss: 1.5337


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.48it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.48it/s]
100%|██████████| 347/347 [00:18<00:00, 18.65it/s]


EPOCH 11: Train acc: 99.47% Train Loss: 0.0399 Test acc: 79.18% Test Loss: 1.4673


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.59it/s]


EPOCH 12: Train acc: 99.51% Train Loss: 0.0350 Test acc: 78.72% Test Loss: 1.4599


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.72it/s]


EPOCH 13: Train acc: 99.53% Train Loss: 0.0303 Test acc: 80.89% Test Loss: 1.3796


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.82it/s]


EPOCH 14: Train acc: 99.65% Train Loss: 0.0240 Test acc: 77.87% Test Loss: 1.5263


100%|██████████| 385/385 [01:00<00:00,  6.37it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.71it/s]


EPOCH 15: Train acc: 99.62% Train Loss: 0.0249 Test acc: 79.96% Test Loss: 1.3903


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.68it/s]


EPOCH 16: Train acc: 99.55% Train Loss: 0.0320 Test acc: 75.10% Test Loss: 1.7231


100%|██████████| 385/385 [01:00<00:00,  6.37it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.64it/s]


EPOCH 17: Train acc: 99.72% Train Loss: 0.0202 Test acc: 78.31% Test Loss: 1.5153


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.67it/s]


EPOCH 18: Train acc: 99.68% Train Loss: 0.0226 Test acc: 77.20% Test Loss: 1.5908


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.48it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 347/347 [00:18<00:00, 18.67it/s]


EPOCH 19: Train acc: 99.60% Train Loss: 0.0255 Test acc: 76.32% Test Loss: 1.6200


100%|██████████| 385/385 [01:00<00:00,  6.34it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.62it/s]


EPOCH 20: Train acc: 99.78% Train Loss: 0.0176 Test acc: 76.98% Test Loss: 1.5830


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.48it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 347/347 [00:18<00:00, 18.75it/s]


EPOCH 21: Train acc: 99.70% Train Loss: 0.0220 Test acc: 77.08% Test Loss: 1.6406


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.51it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.68it/s]


EPOCH 22: Train acc: 99.76% Train Loss: 0.0175 Test acc: 78.87% Test Loss: 1.5525


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.52it/s]
100%|██████████| 347/347 [00:18<00:00, 18.71it/s]


EPOCH 23: Train acc: 99.66% Train Loss: 0.0186 Test acc: 76.42% Test Loss: 1.6770


100%|██████████| 385/385 [01:00<00:00,  6.36it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.68it/s]


EPOCH 24: Train acc: 99.68% Train Loss: 0.0206 Test acc: 78.96% Test Loss: 1.4505


100%|██████████| 385/385 [01:00<00:00,  6.35it/s]
100%|██████████| 385/385 [00:59<00:00,  6.49it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 385/385 [00:59<00:00,  6.50it/s]
100%|██████████| 347/347 [00:18<00:00, 18.81it/s]


EPOCH 25: Train acc: 99.71% Train Loss: 0.0193 Test acc: 76.62% Test Loss: 1.6647



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,▃▂▁▃▄▄▆▅▆▅▄▄▃▅▃█▅▆▆▆▇▅▇▄▇
test/test_accuracy,▆▇█▅▅▄▃▄▃▄▅▅▇▄▆▁▄▃▂▃▃▅▂▅▃
test/test_loss,▃▂▁▃▄▄▆▅▆▅▄▄▃▅▃█▅▆▆▆▇▅▇▄▇
train/train_accuracy,▁▅▆▇▇████████████████████
train/train_loss,█▄▃▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,25.0
loss,1.66469
test/test_accuracy,0.76622
test/test_loss,1.66469
train/train_accuracy,0.9971
train/train_loss,0.01935


Run 925yo3hw errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: [32m[41mERROR[0m Run 925yo3hw errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: Agent Starting Run: mcx3xz7m with config:
[34m[1mwandb[0m: 	batch_size: 17
[34m[1mwandb[0m: 	criterion: loge
[34m[1mwandb[0m: 	device: cuda:2
[34m[1mwandb[0m: 	epochs: 25
[34m[1mwandb[0m: 	hidden_dim: 512
[34m[1mwandb[0m: 	learning_rate: 5.6846545379717045e-05
[34m[1mwandb[0m: 	num_heads: 1
[34m[1mwandb[0m: 	num_hidden: 4
[34m[1mwandb[0m: 	optimizer: nadam
[34m[1mwandb[0m: 	similarity_threshold: 0.75


100%|██████████| 589/589 [01:08<00:00,  8.59it/s]
100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.86it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 530/530 [00:21<00:00, 24.65it/s]


EPOCH 1: Train acc: 79.78% Train Loss: 1.2045 Test acc: 78.92% Test Loss: 1.3600


100%|██████████| 589/589 [01:08<00:00,  8.56it/s]
100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 589/589 [01:07<00:00,  8.79it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 530/530 [00:21<00:00, 24.59it/s]


EPOCH 2: Train acc: 91.14% Train Loss: 0.5236 Test acc: 77.43% Test Loss: 1.4646


100%|██████████| 589/589 [01:08<00:00,  8.58it/s]
100%|██████████| 589/589 [01:06<00:00,  8.80it/s]
100%|██████████| 589/589 [01:07<00:00,  8.79it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 530/530 [00:21<00:00, 24.67it/s]


EPOCH 3: Train acc: 93.77% Train Loss: 0.3709 Test acc: 77.78% Test Loss: 1.4465


100%|██████████| 589/589 [01:08<00:00,  8.56it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:06<00:00,  8.80it/s]
100%|██████████| 530/530 [00:21<00:00, 24.80it/s]


EPOCH 4: Train acc: 95.35% Train Loss: 0.2785 Test acc: 79.56% Test Loss: 1.3471


100%|██████████| 589/589 [01:08<00:00,  8.58it/s]
100%|██████████| 589/589 [01:06<00:00,  8.80it/s]
100%|██████████| 589/589 [01:07<00:00,  8.79it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 530/530 [00:21<00:00, 24.54it/s]


EPOCH 5: Train acc: 96.69% Train Loss: 0.2042 Test acc: 76.63% Test Loss: 1.4928


100%|██████████| 589/589 [01:08<00:00,  8.58it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 530/530 [00:21<00:00, 24.58it/s]


EPOCH 6: Train acc: 97.74% Train Loss: 0.1408 Test acc: 78.18% Test Loss: 1.4506


100%|██████████| 589/589 [01:09<00:00,  8.53it/s]
100%|██████████| 589/589 [01:06<00:00,  8.79it/s]
100%|██████████| 589/589 [01:06<00:00,  8.80it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 530/530 [00:21<00:00, 24.58it/s]


EPOCH 7: Train acc: 98.16% Train Loss: 0.1138 Test acc: 78.20% Test Loss: 1.4346


100%|██████████| 589/589 [01:08<00:00,  8.57it/s]
100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 530/530 [00:21<00:00, 24.70it/s]


EPOCH 8: Train acc: 98.63% Train Loss: 0.0911 Test acc: 77.78% Test Loss: 1.4884


100%|██████████| 589/589 [01:08<00:00,  8.59it/s]
100%|██████████| 589/589 [01:07<00:00,  8.79it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:06<00:00,  8.80it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 530/530 [00:21<00:00, 25.11it/s]


EPOCH 9: Train acc: 98.90% Train Loss: 0.0733 Test acc: 74.86% Test Loss: 1.6856


100%|██████████| 589/589 [01:09<00:00,  8.49it/s]
100%|██████████| 589/589 [01:07<00:00,  8.78it/s]
100%|██████████| 589/589 [01:06<00:00,  8.80it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 530/530 [00:21<00:00, 24.75it/s]


EPOCH 10: Train acc: 98.95% Train Loss: 0.0637 Test acc: 77.99% Test Loss: 1.5022


100%|██████████| 589/589 [01:08<00:00,  8.60it/s]
100%|██████████| 589/589 [01:06<00:00,  8.91it/s]
100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 589/589 [01:06<00:00,  8.87it/s]
100%|██████████| 589/589 [01:06<00:00,  8.86it/s]
100%|██████████| 530/530 [00:21<00:00, 24.46it/s]


EPOCH 11: Train acc: 99.30% Train Loss: 0.0495 Test acc: 76.80% Test Loss: 1.5754


100%|██████████| 589/589 [01:08<00:00,  8.59it/s]
100%|██████████| 589/589 [01:07<00:00,  8.78it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.88it/s]
100%|██████████| 589/589 [01:06<00:00,  8.89it/s]
100%|██████████| 530/530 [00:21<00:00, 25.12it/s]


EPOCH 12: Train acc: 99.35% Train Loss: 0.0472 Test acc: 77.02% Test Loss: 1.5299


100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 530/530 [00:21<00:00, 24.86it/s]


EPOCH 13: Train acc: 99.32% Train Loss: 0.0442 Test acc: 74.71% Test Loss: 1.7428


100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 530/530 [00:21<00:00, 24.94it/s]


EPOCH 14: Train acc: 99.45% Train Loss: 0.0356 Test acc: 74.97% Test Loss: 1.7313


100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 530/530 [00:21<00:00, 24.91it/s]


EPOCH 15: Train acc: 99.49% Train Loss: 0.0368 Test acc: 75.64% Test Loss: 1.6525


100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.06it/s]
100%|██████████| 530/530 [00:21<00:00, 24.93it/s]


EPOCH 16: Train acc: 99.47% Train Loss: 0.0372 Test acc: 75.92% Test Loss: 1.6706


100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 589/589 [01:05<00:00,  8.99it/s]
100%|██████████| 530/530 [00:21<00:00, 24.89it/s]


EPOCH 17: Train acc: 99.62% Train Loss: 0.0282 Test acc: 77.10% Test Loss: 1.5180


100%|██████████| 589/589 [01:08<00:00,  8.60it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:06<00:00,  8.88it/s]
100%|██████████| 589/589 [01:06<00:00,  8.86it/s]
100%|██████████| 530/530 [00:21<00:00, 24.61it/s]


EPOCH 18: Train acc: 99.64% Train Loss: 0.0262 Test acc: 77.20% Test Loss: 1.5490


100%|██████████| 589/589 [01:08<00:00,  8.59it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 589/589 [01:06<00:00,  8.86it/s]
100%|██████████| 589/589 [01:06<00:00,  8.86it/s]
100%|██████████| 530/530 [00:21<00:00, 24.57it/s]


EPOCH 19: Train acc: 99.65% Train Loss: 0.0240 Test acc: 76.13% Test Loss: 1.6214


100%|██████████| 589/589 [01:08<00:00,  8.62it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 589/589 [01:06<00:00,  8.87it/s]
100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 530/530 [00:21<00:00, 24.74it/s]


EPOCH 20: Train acc: 99.56% Train Loss: 0.0282 Test acc: 75.53% Test Loss: 1.6624


100%|██████████| 589/589 [01:08<00:00,  8.55it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:07<00:00,  8.78it/s]
100%|██████████| 589/589 [01:06<00:00,  8.88it/s]
100%|██████████| 589/589 [01:06<00:00,  8.84it/s]
100%|██████████| 530/530 [00:21<00:00, 24.61it/s]


EPOCH 21: Train acc: 99.74% Train Loss: 0.0183 Test acc: 74.03% Test Loss: 1.7467


100%|██████████| 589/589 [01:08<00:00,  8.59it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:06<00:00,  8.82it/s]
100%|██████████| 589/589 [01:06<00:00,  8.90it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 530/530 [00:21<00:00, 24.85it/s]


EPOCH 22: Train acc: 99.63% Train Loss: 0.0279 Test acc: 76.23% Test Loss: 1.6853


100%|██████████| 589/589 [01:06<00:00,  8.81it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.02it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 530/530 [00:21<00:00, 24.87it/s]


EPOCH 23: Train acc: 99.77% Train Loss: 0.0198 Test acc: 77.98% Test Loss: 1.5028


100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.05it/s]
100%|██████████| 589/589 [01:05<00:00,  9.03it/s]
100%|██████████| 589/589 [01:05<00:00,  9.04it/s]
100%|██████████| 530/530 [00:21<00:00, 24.84it/s]


EPOCH 24: Train acc: 99.77% Train Loss: 0.0203 Test acc: 75.84% Test Loss: 1.6363


100%|██████████| 589/589 [01:06<00:00,  8.83it/s]
100%|██████████| 589/589 [01:05<00:00,  9.02it/s]
100%|██████████| 589/589 [01:05<00:00,  8.97it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 589/589 [01:06<00:00,  8.85it/s]
100%|██████████| 530/530 [00:21<00:00, 24.54it/s]


EPOCH 25: Train acc: 99.74% Train Loss: 0.0178 Test acc: 76.38% Test Loss: 1.6005



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
epoch,▁▁▂▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇▇██
loss,▁▃▃▁▄▃▃▃▇▄▅▄██▆▇▄▅▆▇█▇▄▆▅
test/test_accuracy,▇▅▆█▄▆▆▆▂▆▅▅▂▂▃▃▅▅▄▃▁▄▆▃▄
test/test_loss,▁▃▃▁▄▃▃▃▇▄▅▄██▆▇▄▅▆▇█▇▄▆▅
train/train_accuracy,▁▅▆▆▇▇▇██████████████████
train/train_loss,█▄▃▃▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
epoch,25.0
loss,1.60049
test/test_accuracy,0.76378
test/test_loss,1.60049
train/train_accuracy,0.9974
train/train_loss,0.01781


Run mcx3xz7m errored: NameError("name 'classes' is not defined")
[34m[1mwandb[0m: [32m[41mERROR[0m Run mcx3xz7m errored: NameError("name 'classes' is not defined")
Detected 5 failed runs in a row at start, killing sweep.
[34m[1mwandb[0m: [32m[41mERROR[0m Detected 5 failed runs in a row at start, killing sweep.
[34m[1mwandb[0m: To change this value set WANDB_AGENT_MAX_INITIAL_FAILURES=val
