In [1]:
import os
import random
import shutil
import time
import warnings

import torch
import torch.nn as nn
import torch.backends.cudnn as cudnn
import torch.optim

import torch.utils.data
import torchvision
import torchvision.transforms as transforms
import torchvision.datasets as datasets
import torchvision.models as models

In [2]:
SEED=1

In [3]:
random.seed(SEED)
torch.manual_seed(SEED)
cudnn.deterministic = True

In [4]:
torch.cuda.device_count()

1

In [5]:
START_EPOCH = 0

In [6]:
ARCH = 'resnet50'
EPOCHS = 200
LR = 0.1
MOMENTUM = 0.9
WEIGHT_DECAY = 1e-4
PRINT_FREQ = 50
TRAIN_BATCH=256
VAL_BATCH=256
WORKERS=8
TRAINDIR="/data/train"
VALDIR="/data/val"

In [7]:
if not torch.cuda.is_available():
    print('GPU not detected.. did you pass through your GPU?')

In [8]:
GPU = 0

In [9]:
torch.cuda.set_device(GPU)

In [10]:
cudnn.benchmark = True

In [11]:
def train(train_loader, model, criterion, optimizer, epoch):
    batch_time = AverageMeter('Time', ':6.3f')
    data_time = AverageMeter('Data', ':6.3f')
    losses = AverageMeter('Loss', ':.4e')
    top1 = AverageMeter('Acc@1', ':6.2f')
    top5 = AverageMeter('Acc@5', ':6.2f')
    progress = ProgressMeter(
        len(train_loader),
        [batch_time, data_time, losses, top1, top5],
        prefix="Epoch: [{}]".format(epoch))

    # switch to train mode
    model.train()

    end = time.time()
    for i, (images, target) in enumerate(train_loader):
        # measure data loading time
        data_time.update(time.time() - end)

        if GPU is not None:
            images = images.cuda(GPU, non_blocking=True)
        if torch.cuda.is_available():
            target = target.cuda(GPU, non_blocking=True)

        # compute output
        output = model(images)
        loss = criterion(output, target)

        # measure accuracy and record loss
        acc1, acc5 = accuracy(output, target, topk=(1, 5))
        losses.update(loss.item(), images.size(0))
        top1.update(acc1[0], images.size(0))
        top5.update(acc5[0], images.size(0))

        # compute gradient and do SGD step
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # measure elapsed time
        batch_time.update(time.time() - end)
        end = time.time()

        if i % PRINT_FREQ == 0:
            progress.display(i)

In [12]:
def validate(val_loader, model, criterion):
    batch_time = AverageMeter('Time', ':6.3f')
    losses = AverageMeter('Loss', ':.4e')
    top1 = AverageMeter('Acc@1', ':6.2f')
    top5 = AverageMeter('Acc@5', ':6.2f')
    progress = ProgressMeter(
        len(val_loader),
        [batch_time, losses, top1, top5],
        prefix='Test: ')

    # switch to evaluate mode
    model.eval()

    with torch.no_grad():
        end = time.time()
        for i, (images, target) in enumerate(val_loader):
            if GPU is not None:
                images = images.cuda(GPU, non_blocking=True)
            if torch.cuda.is_available():
                target = target.cuda(GPU, non_blocking=True)

            # compute output
            output = model(images)
            loss = criterion(output, target)

            # measure accuracy and record loss
            acc1, acc5 = accuracy(output, target, topk=(1, 5))
            losses.update(loss.item(), images.size(0))
            top1.update(acc1[0], images.size(0))
            top5.update(acc5[0], images.size(0))

            # measure elapsed time
            batch_time.update(time.time() - end)
            end = time.time()

            if i % PRINT_FREQ == 0:
                progress.display(i)

        # TODO: this should also be done with the ProgressMeter
        print(' * Acc@1 {top1.avg:.3f} Acc@5 {top5.avg:.3f}'
              .format(top1=top1, top5=top5))

    return top1.avg

In [13]:
def save_checkpoint(state, is_best, filename='checkpoint.pth.tar'):
    torch.save(state, filename)
    if is_best:
        shutil.copyfile(filename, 'model_best.pth.tar')

In [14]:
class AverageMeter(object):
    """Computes and stores the average and current value"""
    def __init__(self, name, fmt=':f'):
        self.name = name
        self.fmt = fmt
        self.reset()

    def reset(self):
        self.val = 0
        self.avg = 0
        self.sum = 0
        self.count = 0

    def update(self, val, n=1):
        self.val = val
        self.sum += val * n
        self.count += n
        self.avg = self.sum / self.count

    def __str__(self):
        fmtstr = '{name} {val' + self.fmt + '} ({avg' + self.fmt + '})'
        return fmtstr.format(**self.__dict__)

In [15]:
class ProgressMeter(object):
    def __init__(self, num_batches, meters, prefix=""):
        self.batch_fmtstr = self._get_batch_fmtstr(num_batches)
        self.meters = meters
        self.prefix = prefix

    def display(self, batch):
        entries = [self.prefix + self.batch_fmtstr.format(batch)]
        entries += [str(meter) for meter in self.meters]
        print('\t'.join(entries))

    def _get_batch_fmtstr(self, num_batches):
        num_digits = len(str(num_batches // 1))
        fmt = '{:' + str(num_digits) + 'd}'
        return '[' + fmt + '/' + fmt.format(num_batches) + ']'

In [16]:
def adjust_learning_rate(optimizer, epoch):
    """Sets the learning rate to the initial LR decayed by 10 every 30 epochs"""
#     lr = LR * (0.1 ** (epoch // 30))
    lr = LR * (0.1 ** (epoch // 17))
    for param_group in optimizer.param_groups:
        param_group['lr'] = lr

In [17]:
def accuracy(output, target, topk=(1,)):
    """Computes the accuracy over the k top predictions for the specified values of k"""
    with torch.no_grad():
        maxk = max(topk)
        batch_size = target.size(0)

        _, pred = output.topk(maxk, 1, True, True)
        pred = pred.t()
        correct = pred.eq(target.view(1, -1).expand_as(pred))

        res = []
        for k in topk:
            correct_k = correct[:k].reshape(-1).float().sum(0, keepdim=True)
            res.append(correct_k.mul_(100.0 / batch_size))
        return res

In [18]:
imagenet_mean_RGB = [0.47889522, 0.47227842, 0.43047404]
imagenet_std_RGB = [0.229, 0.224, 0.225]
cinic_mean_RGB = [0.47889522, 0.47227842, 0.43047404]
cinic_std_RGB = [0.24205776, 0.23828046, 0.25874835]
cifar_mean_RGB = [0.4914, 0.4822, 0.4465]
cifar_std_RGB = [0.2023, 0.1994, 0.2010]

In [19]:
normalize = transforms.Normalize(mean=imagenet_mean_RGB, std=imagenet_std_RGB)

In [20]:
IMG_SIZE = 224

In [21]:
NUM_CLASSES = 1000

In [22]:
model = models.__dict__[ARCH]()

In [23]:
inf = model.fc.in_features

In [24]:
model.fc = nn.Linear(inf, NUM_CLASSES)

In [25]:
model.cuda(GPU)

ResNet(
  (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
  (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (relu): ReLU(inplace=True)
  (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
  (layer1): Sequential(
    (0): BasicBlock(
      (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
      (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    )
    (1): BasicBlock(
      (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
  

In [26]:
criterion = nn.CrossEntropyLoss().cuda(GPU)

In [27]:
optimizer = torch.optim.SGD(model.parameters(), LR,
                                momentum=MOMENTUM,
                                weight_decay=WEIGHT_DECAY)

In [28]:
scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(optimizer, T_max=EPOCHS)

In [30]:
# train_dataset = datasets.ImageFolder(
#     TRAINDIR, transform=transform_train)
train_dataset = datasets.ImageFolder(
    TRAINDIR,
    transforms.Compose([
        transforms.Resize(256),
        transforms.RandomResizedCrop(224),
        transforms.CenterCrop(224),
        transforms.RandomHorizontalFlip(),
        transforms.ToTensor(),
        normalize,
    ])
)

In [31]:
# transform_val = transforms.Compose([
#     transforms.ToTensor(),
#     transforms.Normalize(imagenet_mean_RGB, imagenet_std_RGB),
# ])

In [32]:
# val_dataset = datasets.ImageFolder(
#     VALDIR, transform=transform_val)
val_dataset = datasets.ImageFolder(
    VALDIR,
    transforms.Compose([
        transforms.Resize(256),
        transforms.CenterCrop(224),
        transforms.ToTensor(),
        normalize,
    ])
)

In [33]:
train_loader = torch.utils.data.DataLoader(
        train_dataset, batch_size=TRAIN_BATCH, shuffle=True,
        num_workers=WORKERS, pin_memory=True, sampler=None)

In [34]:
val_loader = torch.utils.data.DataLoader(
        val_dataset, batch_size=VAL_BATCH, shuffle=False,
        num_workers=WORKERS, pin_memory=True, sampler=None) 

In [35]:
best_acc1 = 0

In [36]:
for epoch in range(START_EPOCH, EPOCHS):
    adjust_learning_rate(optimizer, epoch)

    # train for one epoch
    train(train_loader, model, criterion, optimizer, epoch)

    # evaluate on validation set
    acc1 = validate(val_loader, model, criterion)

    # remember best acc@1 and save checkpoint
    is_best = acc1 > best_acc1
    best_acc1 = max(acc1, best_acc1)


    save_checkpoint({
        'epoch': epoch + 1,
        'arch': ARCH,
        'state_dict': model.state_dict(),
        'best_acc1': best_acc1,
        'optimizer' : optimizer.state_dict(),
    }, is_best)
    
    scheduler.step()
    print('lr: ' + str(scheduler.get_last_lr()))

Epoch: [0][   0/5005]	Time 12.060 (12.060)	Data  3.392 ( 3.392)	Loss 6.9885e+00 (6.9885e+00)	Acc@1   0.00 (  0.00)	Acc@5   0.78 (  0.78)
Epoch: [0][  50/5005]	Time  0.682 ( 0.892)	Data  0.000 ( 0.067)	Loss 6.9371e+00 (7.0183e+00)	Acc@1   0.39 (  0.28)	Acc@5   1.56 (  0.97)
Epoch: [0][ 100/5005]	Time  0.680 ( 0.787)	Data  0.000 ( 0.038)	Loss 6.7528e+00 (6.9203e+00)	Acc@1   1.17 (  0.33)	Acc@5   1.56 (  1.32)
Epoch: [0][ 150/5005]	Time  0.687 ( 0.753)	Data  0.000 ( 0.029)	Loss 6.6948e+00 (6.8425e+00)	Acc@1   0.00 (  0.46)	Acc@5   1.95 (  1.81)
Epoch: [0][ 200/5005]	Time  0.683 ( 0.736)	Data  0.000 ( 0.024)	Loss 6.6117e+00 (6.7833e+00)	Acc@1   0.39 (  0.54)	Acc@5   2.34 (  2.05)
Epoch: [0][ 250/5005]	Time  0.681 ( 0.725)	Data  0.000 ( 0.021)	Loss 6.4819e+00 (6.7322e+00)	Acc@1   0.39 (  0.60)	Acc@5   3.91 (  2.32)
Epoch: [0][ 300/5005]	Time  0.680 ( 0.718)	Data  0.000 ( 0.019)	Loss 6.3872e+00 (6.6852e+00)	Acc@1   1.56 (  0.68)	Acc@5   5.47 (  2.61)
Epoch: [0][ 350/5005]	Time  0.685 ( 0.714



Epoch: [0][ 950/5005]	Time  0.690 ( 0.701)	Data  0.000 ( 0.013)	Loss 5.6154e+00 (6.2141e+00)	Acc@1   7.42 (  1.91)	Acc@5  14.84 (  6.67)
Epoch: [0][1000/5005]	Time  0.683 ( 0.700)	Data  0.000 ( 0.012)	Loss 5.5772e+00 (6.1850e+00)	Acc@1   3.91 (  2.02)	Acc@5  16.80 (  6.99)
Epoch: [0][1050/5005]	Time  0.689 ( 0.700)	Data  0.000 ( 0.012)	Loss 5.6172e+00 (6.1574e+00)	Acc@1   3.52 (  2.12)	Acc@5  10.94 (  7.31)
Epoch: [0][1100/5005]	Time  0.684 ( 0.699)	Data  0.000 ( 0.012)	Loss 5.4508e+00 (6.1314e+00)	Acc@1   5.86 (  2.22)	Acc@5  15.23 (  7.60)
Epoch: [0][1150/5005]	Time  0.685 ( 0.699)	Data  0.000 ( 0.012)	Loss 5.5111e+00 (6.1040e+00)	Acc@1   5.08 (  2.34)	Acc@5  17.19 (  7.92)
Epoch: [0][1200/5005]	Time  0.683 ( 0.698)	Data  0.000 ( 0.012)	Loss 5.6030e+00 (6.0792e+00)	Acc@1   5.08 (  2.44)	Acc@5  16.41 (  8.23)
Epoch: [0][1250/5005]	Time  0.686 ( 0.698)	Data  0.000 ( 0.012)	Loss 5.4812e+00 (6.0556e+00)	Acc@1   6.25 (  2.55)	Acc@5  17.58 (  8.52)
Epoch: [0][1300/5005]	Time  0.679 ( 0.697

Epoch: [0][3950/5005]	Time  0.683 ( 0.693)	Data  0.000 ( 0.010)	Loss 4.4426e+00 (5.1551e+00)	Acc@1  15.62 (  9.08)	Acc@5  35.55 ( 22.41)
Epoch: [0][4000/5005]	Time  0.689 ( 0.693)	Data  0.000 ( 0.010)	Loss 4.0964e+00 (5.1433e+00)	Acc@1  18.75 (  9.19)	Acc@5  39.45 ( 22.61)
Epoch: [0][4050/5005]	Time  0.691 ( 0.693)	Data  0.000 ( 0.010)	Loss 4.1174e+00 (5.1311e+00)	Acc@1  23.05 (  9.31)	Acc@5  41.80 ( 22.82)
Epoch: [0][4100/5005]	Time  0.687 ( 0.693)	Data  0.000 ( 0.010)	Loss 4.1015e+00 (5.1191e+00)	Acc@1  21.88 (  9.42)	Acc@5  41.80 ( 23.04)
Epoch: [0][4150/5005]	Time  0.693 ( 0.693)	Data  0.000 ( 0.010)	Loss 4.3607e+00 (5.1074e+00)	Acc@1  16.02 (  9.54)	Acc@5  37.89 ( 23.24)
Epoch: [0][4200/5005]	Time  0.696 ( 0.693)	Data  0.000 ( 0.010)	Loss 3.9379e+00 (5.0960e+00)	Acc@1  22.66 (  9.65)	Acc@5  42.97 ( 23.45)
Epoch: [0][4250/5005]	Time  0.707 ( 0.693)	Data  0.000 ( 0.010)	Loss 4.2802e+00 (5.0848e+00)	Acc@1  16.41 (  9.76)	Acc@5  37.50 ( 23.64)
Epoch: [0][4300/5005]	Time  0.719 ( 0.694

Epoch: [1][1750/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.5567e+00 (3.7475e+00)	Acc@1  28.12 ( 24.33)	Acc@5  50.00 ( 47.62)
Epoch: [1][1800/5005]	Time  0.688 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.7005e+00 (3.7435e+00)	Acc@1  24.61 ( 24.40)	Acc@5  47.66 ( 47.70)
Epoch: [1][1850/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.4168e+00 (3.7395e+00)	Acc@1  28.52 ( 24.45)	Acc@5  58.59 ( 47.78)
Epoch: [1][1900/5005]	Time  0.686 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.6669e+00 (3.7350e+00)	Acc@1  26.56 ( 24.51)	Acc@5  49.61 ( 47.88)
Epoch: [1][1950/5005]	Time  0.685 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.4386e+00 (3.7307e+00)	Acc@1  28.12 ( 24.57)	Acc@5  55.08 ( 47.96)
Epoch: [1][2000/5005]	Time  0.686 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.5550e+00 (3.7267e+00)	Acc@1  26.56 ( 24.63)	Acc@5  52.34 ( 48.03)
Epoch: [1][2050/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.011)	Loss 3.4159e+00 (3.7234e+00)	Acc@1  30.86 ( 24.67)	Acc@5  53.91 ( 48.08)
Epoch: [1][2100/5005]	Time  0.686 ( 0.686



Epoch: [1][3050/5005]	Time  0.691 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.7797e+00 (3.6533e+00)	Acc@1  23.05 ( 25.77)	Acc@5  46.48 ( 49.44)
Epoch: [1][3100/5005]	Time  0.703 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.4458e+00 (3.6503e+00)	Acc@1  26.56 ( 25.82)	Acc@5  53.12 ( 49.50)
Epoch: [1][3150/5005]	Time  0.716 ( 0.687)	Data  0.000 ( 0.010)	Loss 3.4920e+00 (3.6468e+00)	Acc@1  28.91 ( 25.87)	Acc@5  54.69 ( 49.56)
Epoch: [1][3200/5005]	Time  0.694 ( 0.687)	Data  0.000 ( 0.010)	Loss 3.2655e+00 (3.6433e+00)	Acc@1  32.42 ( 25.92)	Acc@5  57.81 ( 49.63)
Epoch: [1][3250/5005]	Time  0.688 ( 0.687)	Data  0.000 ( 0.010)	Loss 3.4818e+00 (3.6394e+00)	Acc@1  28.91 ( 25.98)	Acc@5  55.47 ( 49.70)
Epoch: [1][3300/5005]	Time  0.687 ( 0.687)	Data  0.000 ( 0.010)	Loss 3.2951e+00 (3.6361e+00)	Acc@1  30.08 ( 26.03)	Acc@5  56.25 ( 49.76)
Epoch: [1][3350/5005]	Time  0.688 ( 0.687)	Data  0.000 ( 0.010)	Loss 3.3735e+00 (3.6332e+00)	Acc@1  34.38 ( 26.09)	Acc@5  54.69 ( 49.81)
Epoch: [1][3400/5005]	Time  0.691 ( 0.687

Epoch: [2][ 850/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.012)	Loss 3.1084e+00 (3.1965e+00)	Acc@1  38.28 ( 32.88)	Acc@5  59.38 ( 57.78)
Epoch: [2][ 900/5005]	Time  0.682 ( 0.686)	Data  0.000 ( 0.012)	Loss 3.1276e+00 (3.1972e+00)	Acc@1  33.98 ( 32.87)	Acc@5  60.16 ( 57.77)
Epoch: [2][ 950/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.012)	Loss 3.4574e+00 (3.1956e+00)	Acc@1  30.86 ( 32.91)	Acc@5  52.73 ( 57.80)
Epoch: [2][1000/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.012)	Loss 2.9420e+00 (3.1958e+00)	Acc@1  38.28 ( 32.90)	Acc@5  62.50 ( 57.81)
Epoch: [2][1050/5005]	Time  0.679 ( 0.686)	Data  0.000 ( 0.012)	Loss 3.2799e+00 (3.1955e+00)	Acc@1  27.34 ( 32.91)	Acc@5  56.25 ( 57.83)
Epoch: [2][1100/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.012)	Loss 3.2755e+00 (3.1951e+00)	Acc@1  31.25 ( 32.91)	Acc@5  59.77 ( 57.82)
Epoch: [2][1150/5005]	Time  0.682 ( 0.686)	Data  0.000 ( 0.012)	Loss 3.2772e+00 (3.1943e+00)	Acc@1  30.08 ( 32.92)	Acc@5  56.64 ( 57.82)
Epoch: [2][1200/5005]	Time  0.684 ( 0.685



Epoch: [2][3250/5005]	Time  0.680 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.2077e+00 (3.1381e+00)	Acc@1  33.98 ( 33.89)	Acc@5  58.59 ( 58.88)
Epoch: [2][3300/5005]	Time  0.682 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.8597e+00 (3.1366e+00)	Acc@1  39.06 ( 33.92)	Acc@5  62.89 ( 58.91)
Epoch: [2][3350/5005]	Time  0.685 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.8144e+00 (3.1355e+00)	Acc@1  39.06 ( 33.94)	Acc@5  65.23 ( 58.93)
Epoch: [2][3400/5005]	Time  0.681 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.1230e+00 (3.1345e+00)	Acc@1  34.77 ( 33.95)	Acc@5  60.16 ( 58.95)
Epoch: [2][3450/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.2215e+00 (3.1330e+00)	Acc@1  32.81 ( 33.98)	Acc@5  55.86 ( 58.98)
Epoch: [2][3500/5005]	Time  0.681 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.1953e+00 (3.1321e+00)	Acc@1  31.64 ( 34.00)	Acc@5  59.38 ( 59.01)
Epoch: [2][3550/5005]	Time  0.679 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.9541e+00 (3.1310e+00)	Acc@1  39.84 ( 34.02)	Acc@5  62.50 ( 59.02)
Epoch: [2][3600/5005]	Time  0.682 ( 0.686

Epoch: [3][1050/5005]	Time  0.680 ( 0.689)	Data  0.000 ( 0.012)	Loss 3.0105e+00 (2.9376e+00)	Acc@1  35.55 ( 37.24)	Acc@5  60.94 ( 62.43)
Epoch: [3][1100/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.012)	Loss 2.9070e+00 (2.9369e+00)	Acc@1  41.80 ( 37.28)	Acc@5  63.28 ( 62.44)
Epoch: [3][1150/5005]	Time  0.684 ( 0.689)	Data  0.000 ( 0.012)	Loss 2.8659e+00 (2.9362e+00)	Acc@1  37.50 ( 37.29)	Acc@5  61.72 ( 62.45)
Epoch: [3][1200/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.011)	Loss 3.0360e+00 (2.9363e+00)	Acc@1  35.55 ( 37.29)	Acc@5  59.38 ( 62.44)
Epoch: [3][1250/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.011)	Loss 2.9855e+00 (2.9362e+00)	Acc@1  32.03 ( 37.30)	Acc@5  60.94 ( 62.45)
Epoch: [3][1300/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.011)	Loss 2.6730e+00 (2.9359e+00)	Acc@1  36.33 ( 37.31)	Acc@5  68.75 ( 62.45)
Epoch: [3][1350/5005]	Time  0.678 ( 0.688)	Data  0.000 ( 0.011)	Loss 2.8310e+00 (2.9351e+00)	Acc@1  42.19 ( 37.33)	Acc@5  61.33 ( 62.48)
Epoch: [3][1400/5005]	Time  0.682 ( 0.688



Epoch: [3][3450/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.9206e+00 (2.9210e+00)	Acc@1  33.20 ( 37.58)	Acc@5  63.28 ( 62.80)
Epoch: [3][3500/5005]	Time  0.682 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.6957e+00 (2.9207e+00)	Acc@1  42.19 ( 37.59)	Acc@5  65.62 ( 62.81)
Epoch: [3][3550/5005]	Time  0.684 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.0041e+00 (2.9206e+00)	Acc@1  38.67 ( 37.59)	Acc@5  64.45 ( 62.81)
Epoch: [3][3600/5005]	Time  0.681 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.8403e+00 (2.9201e+00)	Acc@1  40.62 ( 37.60)	Acc@5  66.02 ( 62.82)
Epoch: [3][3650/5005]	Time  0.680 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.9501e+00 (2.9195e+00)	Acc@1  38.28 ( 37.61)	Acc@5  60.55 ( 62.82)
Epoch: [3][3700/5005]	Time  0.682 ( 0.686)	Data  0.000 ( 0.010)	Loss 3.2169e+00 (2.9188e+00)	Acc@1  33.20 ( 37.62)	Acc@5  60.16 ( 62.83)
Epoch: [3][3750/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.9865e+00 (2.9184e+00)	Acc@1  41.80 ( 37.63)	Acc@5  62.11 ( 62.84)
Epoch: [3][3800/5005]	Time  0.682 ( 0.686

Epoch: [4][1250/5005]	Time  0.684 ( 0.696)	Data  0.000 ( 0.012)	Loss 2.4817e+00 (2.8095e+00)	Acc@1  44.14 ( 39.51)	Acc@5  71.09 ( 64.61)
Epoch: [4][1300/5005]	Time  0.681 ( 0.695)	Data  0.000 ( 0.012)	Loss 2.6329e+00 (2.8088e+00)	Acc@1  42.19 ( 39.50)	Acc@5  65.23 ( 64.62)
Epoch: [4][1350/5005]	Time  0.682 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.8912e+00 (2.8094e+00)	Acc@1  35.94 ( 39.48)	Acc@5  65.23 ( 64.60)
Epoch: [4][1400/5005]	Time  0.685 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.7951e+00 (2.8072e+00)	Acc@1  36.72 ( 39.49)	Acc@5  66.41 ( 64.66)
Epoch: [4][1450/5005]	Time  0.684 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.5368e+00 (2.8065e+00)	Acc@1  44.14 ( 39.50)	Acc@5  68.75 ( 64.68)
Epoch: [4][1500/5005]	Time  0.684 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.6745e+00 (2.8062e+00)	Acc@1  41.80 ( 39.50)	Acc@5  67.58 ( 64.69)
Epoch: [4][1550/5005]	Time  0.683 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.5306e+00 (2.8071e+00)	Acc@1  39.45 ( 39.49)	Acc@5  69.14 ( 64.68)
Epoch: [4][1600/5005]	Time  0.702 ( 0.693



Epoch: [4][1900/5005]	Time  0.689 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.6659e+00 (2.8081e+00)	Acc@1  42.97 ( 39.49)	Acc@5  66.41 ( 64.69)
Epoch: [4][1950/5005]	Time  0.687 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.7271e+00 (2.8087e+00)	Acc@1  41.02 ( 39.49)	Acc@5  65.23 ( 64.68)
Epoch: [4][2000/5005]	Time  0.683 ( 0.691)	Data  0.000 ( 0.011)	Loss 3.0658e+00 (2.8080e+00)	Acc@1  38.67 ( 39.51)	Acc@5  58.98 ( 64.70)
Epoch: [4][2050/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.7365e+00 (2.8077e+00)	Acc@1  40.23 ( 39.52)	Acc@5  68.75 ( 64.72)
Epoch: [4][2100/5005]	Time  0.683 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.8208e+00 (2.8076e+00)	Acc@1  42.19 ( 39.53)	Acc@5  61.33 ( 64.71)
Epoch: [4][2150/5005]	Time  0.684 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.7994e+00 (2.8071e+00)	Acc@1  39.06 ( 39.54)	Acc@5  63.28 ( 64.72)
Epoch: [4][2200/5005]	Time  0.687 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.7239e+00 (2.8080e+00)	Acc@1  39.06 ( 39.53)	Acc@5  67.58 ( 64.71)
Epoch: [4][2250/5005]	Time  0.682 ( 0.691

Epoch: [4][4900/5005]	Time  0.705 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.5602e+00 (2.7956e+00)	Acc@1  43.36 ( 39.75)	Acc@5  70.70 ( 64.98)
Epoch: [4][4950/5005]	Time  0.690 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.8444e+00 (2.7959e+00)	Acc@1  40.62 ( 39.75)	Acc@5  63.28 ( 64.98)
Epoch: [4][5000/5005]	Time  0.689 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.7908e+00 (2.7954e+00)	Acc@1  39.06 ( 39.76)	Acc@5  63.28 ( 64.99)
Test: [  0/196]	Time  3.270 ( 3.270)	Loss 1.9710e+00 (1.9710e+00)	Acc@1  58.20 ( 58.20)	Acc@5  77.73 ( 77.73)
Test: [ 50/196]	Time  0.202 ( 0.335)	Loss 2.0519e+00 (2.1667e+00)	Acc@1  49.22 ( 47.52)	Acc@5  79.30 ( 75.88)
Test: [100/196]	Time  0.202 ( 0.308)	Loss 3.4585e+00 (2.3369e+00)	Acc@1  22.66 ( 45.14)	Acc@5  56.25 ( 73.26)
Test: [150/196]	Time  0.204 ( 0.298)	Loss 2.8573e+00 (2.5311e+00)	Acc@1  40.62 ( 42.56)	Acc@5  65.23 ( 69.66)
 * Acc@1 41.758 Acc@5 68.618
lr: [0.09994447548276714]
Epoch: [5][   0/5005]	Time  3.292 ( 3.292)	Data  3.012 ( 3.012)	Loss 2.8207e+00 (2.8207e+00)	A



Epoch: [5][ 750/5005]	Time  0.690 ( 0.700)	Data  0.000 ( 0.014)	Loss 2.5176e+00 (2.7284e+00)	Acc@1  47.66 ( 40.92)	Acc@5  67.97 ( 66.18)
Epoch: [5][ 800/5005]	Time  0.689 ( 0.700)	Data  0.000 ( 0.013)	Loss 2.5737e+00 (2.7295e+00)	Acc@1  42.19 ( 40.90)	Acc@5  69.53 ( 66.16)
Epoch: [5][ 850/5005]	Time  0.685 ( 0.699)	Data  0.000 ( 0.013)	Loss 2.6664e+00 (2.7323e+00)	Acc@1  39.45 ( 40.87)	Acc@5  69.92 ( 66.10)
Epoch: [5][ 900/5005]	Time  0.686 ( 0.698)	Data  0.000 ( 0.013)	Loss 2.6443e+00 (2.7328e+00)	Acc@1  38.28 ( 40.86)	Acc@5  66.02 ( 66.10)
Epoch: [5][ 950/5005]	Time  0.683 ( 0.697)	Data  0.000 ( 0.013)	Loss 2.5582e+00 (2.7330e+00)	Acc@1  39.45 ( 40.85)	Acc@5  69.53 ( 66.08)
Epoch: [5][1000/5005]	Time  0.683 ( 0.697)	Data  0.000 ( 0.012)	Loss 2.5131e+00 (2.7330e+00)	Acc@1  40.23 ( 40.82)	Acc@5  70.70 ( 66.08)
Epoch: [5][1050/5005]	Time  0.686 ( 0.696)	Data  0.000 ( 0.012)	Loss 2.8945e+00 (2.7342e+00)	Acc@1  37.50 ( 40.80)	Acc@5  62.50 ( 66.07)
Epoch: [5][1100/5005]	Time  0.682 ( 0.695

Epoch: [5][3750/5005]	Time  0.695 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.9082e+00 (2.7278e+00)	Acc@1  37.89 ( 40.94)	Acc@5  62.50 ( 66.12)
Epoch: [5][3800/5005]	Time  0.689 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6730e+00 (2.7275e+00)	Acc@1  41.80 ( 40.95)	Acc@5  68.36 ( 66.13)
Epoch: [5][3850/5005]	Time  0.685 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.7735e+00 (2.7271e+00)	Acc@1  39.45 ( 40.96)	Acc@5  62.11 ( 66.14)
Epoch: [5][3900/5005]	Time  0.688 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6507e+00 (2.7270e+00)	Acc@1  41.02 ( 40.96)	Acc@5  67.58 ( 66.14)
Epoch: [5][3950/5005]	Time  0.687 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6709e+00 (2.7271e+00)	Acc@1  38.67 ( 40.95)	Acc@5  66.80 ( 66.13)
Epoch: [5][4000/5005]	Time  0.693 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6734e+00 (2.7271e+00)	Acc@1  42.19 ( 40.95)	Acc@5  66.41 ( 66.12)
Epoch: [5][4050/5005]	Time  0.700 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.7369e+00 (2.7266e+00)	Acc@1  44.53 ( 40.97)	Acc@5  65.23 ( 66.13)
Epoch: [5][4100/5005]	Time  0.710 ( 0.691

Epoch: [6][1550/5005]	Time  0.690 ( 0.690)	Data  0.000 ( 0.011)	Loss 2.5406e+00 (2.6751e+00)	Acc@1  45.31 ( 41.73)	Acc@5  69.14 ( 66.96)
Epoch: [6][1600/5005]	Time  0.682 ( 0.690)	Data  0.000 ( 0.011)	Loss 2.8459e+00 (2.6741e+00)	Acc@1  39.45 ( 41.75)	Acc@5  66.80 ( 66.97)
Epoch: [6][1650/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.011)	Loss 2.5956e+00 (2.6735e+00)	Acc@1  39.84 ( 41.77)	Acc@5  68.75 ( 66.99)
Epoch: [6][1700/5005]	Time  0.686 ( 0.689)	Data  0.000 ( 0.011)	Loss 2.8891e+00 (2.6728e+00)	Acc@1  41.02 ( 41.79)	Acc@5  62.89 ( 67.01)
Epoch: [6][1750/5005]	Time  0.684 ( 0.689)	Data  0.000 ( 0.011)	Loss 2.5763e+00 (2.6738e+00)	Acc@1  41.02 ( 41.76)	Acc@5  67.58 ( 67.00)
Epoch: [6][1800/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.011)	Loss 2.7722e+00 (2.6744e+00)	Acc@1  37.89 ( 41.76)	Acc@5  65.62 ( 66.97)
Epoch: [6][1850/5005]	Time  0.688 ( 0.689)	Data  0.000 ( 0.011)	Loss 2.5675e+00 (2.6741e+00)	Acc@1  44.14 ( 41.77)	Acc@5  68.75 ( 66.97)
Epoch: [6][1900/5005]	Time  0.683 ( 0.689



Epoch: [6][2700/5005]	Time  0.686 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.5099e+00 (2.6771e+00)	Acc@1  45.70 ( 41.76)	Acc@5  67.97 ( 66.92)
Epoch: [6][2750/5005]	Time  0.691 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.6605e+00 (2.6771e+00)	Acc@1  41.02 ( 41.77)	Acc@5  70.31 ( 66.92)
Epoch: [6][2800/5005]	Time  0.689 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.5742e+00 (2.6777e+00)	Acc@1  42.58 ( 41.76)	Acc@5  69.53 ( 66.92)
Epoch: [6][2850/5005]	Time  0.693 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.6365e+00 (2.6773e+00)	Acc@1  40.62 ( 41.78)	Acc@5  70.70 ( 66.94)
Epoch: [6][2900/5005]	Time  0.704 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.6484e+00 (2.6773e+00)	Acc@1  42.97 ( 41.79)	Acc@5  67.97 ( 66.94)
Epoch: [6][2950/5005]	Time  0.716 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.7595e+00 (2.6774e+00)	Acc@1  40.62 ( 41.79)	Acc@5  64.06 ( 66.93)
Epoch: [6][3000/5005]	Time  0.697 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6760e+00 (2.6776e+00)	Acc@1  41.80 ( 41.79)	Acc@5  63.67 ( 66.93)
Epoch: [6][3050/5005]	Time  0.691 ( 0.689

Epoch: [7][ 500/5005]	Time  0.681 ( 0.695)	Data  0.000 ( 0.016)	Loss 2.6412e+00 (2.6131e+00)	Acc@1  42.97 ( 42.97)	Acc@5  68.36 ( 68.06)
Epoch: [7][ 550/5005]	Time  0.686 ( 0.694)	Data  0.000 ( 0.015)	Loss 2.7380e+00 (2.6133e+00)	Acc@1  46.48 ( 42.94)	Acc@5  67.19 ( 68.11)




Epoch: [7][ 600/5005]	Time  0.682 ( 0.693)	Data  0.000 ( 0.015)	Loss 2.7096e+00 (2.6147e+00)	Acc@1  43.36 ( 42.87)	Acc@5  65.23 ( 68.06)
Epoch: [7][ 650/5005]	Time  0.686 ( 0.693)	Data  0.000 ( 0.014)	Loss 2.5538e+00 (2.6187e+00)	Acc@1  44.53 ( 42.81)	Acc@5  70.31 ( 68.01)
Epoch: [7][ 700/5005]	Time  0.685 ( 0.692)	Data  0.000 ( 0.014)	Loss 2.4799e+00 (2.6217e+00)	Acc@1  46.48 ( 42.73)	Acc@5  71.48 ( 67.94)
Epoch: [7][ 750/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.014)	Loss 2.5397e+00 (2.6228e+00)	Acc@1  46.09 ( 42.73)	Acc@5  70.31 ( 67.91)
Epoch: [7][ 800/5005]	Time  0.684 ( 0.691)	Data  0.000 ( 0.013)	Loss 2.3857e+00 (2.6208e+00)	Acc@1  44.53 ( 42.74)	Acc@5  74.61 ( 67.95)
Epoch: [7][ 850/5005]	Time  0.680 ( 0.691)	Data  0.000 ( 0.013)	Loss 2.7768e+00 (2.6220e+00)	Acc@1  41.80 ( 42.67)	Acc@5  65.62 ( 67.92)
Epoch: [7][ 900/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.013)	Loss 2.4830e+00 (2.6259e+00)	Acc@1  46.48 ( 42.62)	Acc@5  69.53 ( 67.87)
Epoch: [7][ 950/5005]	Time  0.689 ( 0.690

Epoch: [7][3600/5005]	Time  0.690 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.5461e+00 (2.6354e+00)	Acc@1  46.48 ( 42.51)	Acc@5  69.92 ( 67.68)
Epoch: [7][3650/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.010)	Loss 3.0740e+00 (2.6361e+00)	Acc@1  36.33 ( 42.50)	Acc@5  59.38 ( 67.67)
Epoch: [7][3700/5005]	Time  0.681 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6225e+00 (2.6359e+00)	Acc@1  44.53 ( 42.50)	Acc@5  67.58 ( 67.68)
Epoch: [7][3750/5005]	Time  0.683 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.9610e+00 (2.6358e+00)	Acc@1  35.55 ( 42.52)	Acc@5  62.89 ( 67.68)
Epoch: [7][3800/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.7215e+00 (2.6362e+00)	Acc@1  44.53 ( 42.51)	Acc@5  71.09 ( 67.67)
Epoch: [7][3850/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4007e+00 (2.6361e+00)	Acc@1  47.66 ( 42.51)	Acc@5  71.48 ( 67.67)
Epoch: [7][3900/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5542e+00 (2.6359e+00)	Acc@1  42.97 ( 42.51)	Acc@5  69.92 ( 67.67)
Epoch: [7][3950/5005]	Time  0.685 ( 0.689

Epoch: [8][1400/5005]	Time  0.681 ( 0.696)	Data  0.000 ( 0.012)	Loss 2.5872e+00 (2.6048e+00)	Acc@1  45.31 ( 43.13)	Acc@5  67.97 ( 68.26)
Epoch: [8][1450/5005]	Time  0.685 ( 0.696)	Data  0.000 ( 0.012)	Loss 2.6037e+00 (2.6053e+00)	Acc@1  44.92 ( 43.12)	Acc@5  71.09 ( 68.24)
Epoch: [8][1500/5005]	Time  0.682 ( 0.696)	Data  0.000 ( 0.012)	Loss 2.6822e+00 (2.6035e+00)	Acc@1  43.75 ( 43.14)	Acc@5  66.02 ( 68.28)
Epoch: [8][1550/5005]	Time  0.684 ( 0.695)	Data  0.000 ( 0.012)	Loss 2.3959e+00 (2.6045e+00)	Acc@1  46.88 ( 43.12)	Acc@5  71.09 ( 68.26)
Epoch: [8][1600/5005]	Time  0.685 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.5774e+00 (2.6053e+00)	Acc@1  44.92 ( 43.12)	Acc@5  70.70 ( 68.24)
Epoch: [8][1650/5005]	Time  0.689 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.5874e+00 (2.6062e+00)	Acc@1  43.75 ( 43.11)	Acc@5  66.80 ( 68.22)
Epoch: [8][1700/5005]	Time  0.692 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.7015e+00 (2.6069e+00)	Acc@1  38.28 ( 43.09)	Acc@5  66.41 ( 68.20)
Epoch: [8][1750/5005]	Time  0.690 ( 0.694



Epoch: [8][2250/5005]	Time  0.686 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.6844e+00 (2.6053e+00)	Acc@1  39.45 ( 43.10)	Acc@5  67.97 ( 68.21)
Epoch: [8][2300/5005]	Time  0.681 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.6814e+00 (2.6054e+00)	Acc@1  42.97 ( 43.09)	Acc@5  69.53 ( 68.20)
Epoch: [8][2350/5005]	Time  0.687 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.5581e+00 (2.6052e+00)	Acc@1  39.06 ( 43.09)	Acc@5  70.70 ( 68.20)
Epoch: [8][2400/5005]	Time  0.686 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.7157e+00 (2.6054e+00)	Acc@1  41.80 ( 43.09)	Acc@5  66.41 ( 68.20)
Epoch: [8][2450/5005]	Time  0.681 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.5041e+00 (2.6055e+00)	Acc@1  44.53 ( 43.08)	Acc@5  68.36 ( 68.20)
Epoch: [8][2500/5005]	Time  0.683 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.5472e+00 (2.6060e+00)	Acc@1  42.97 ( 43.08)	Acc@5  69.53 ( 68.19)
Epoch: [8][2550/5005]	Time  0.684 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.5737e+00 (2.6065e+00)	Acc@1  41.02 ( 43.07)	Acc@5  67.97 ( 68.18)
Epoch: [8][2600/5005]	Time  0.687 ( 0.693

Epoch: [9][  50/5005]	Time  0.685 ( 0.736)	Data  0.000 ( 0.069)	Loss 2.6231e+00 (2.5817e+00)	Acc@1  42.97 ( 43.41)	Acc@5  69.92 ( 68.52)
Epoch: [9][ 100/5005]	Time  0.688 ( 0.712)	Data  0.000 ( 0.040)	Loss 2.3870e+00 (2.5754e+00)	Acc@1  45.31 ( 43.37)	Acc@5  70.70 ( 68.83)
Epoch: [9][ 150/5005]	Time  0.691 ( 0.705)	Data  0.000 ( 0.030)	Loss 2.4318e+00 (2.5705e+00)	Acc@1  48.05 ( 43.55)	Acc@5  74.22 ( 68.76)
Epoch: [9][ 200/5005]	Time  0.697 ( 0.702)	Data  0.000 ( 0.025)	Loss 2.5570e+00 (2.5702e+00)	Acc@1  45.70 ( 43.57)	Acc@5  67.97 ( 68.92)
Epoch: [9][ 250/5005]	Time  0.702 ( 0.702)	Data  0.000 ( 0.022)	Loss 2.7783e+00 (2.5648e+00)	Acc@1  41.41 ( 43.64)	Acc@5  66.80 ( 69.02)
Epoch: [9][ 300/5005]	Time  0.717 ( 0.703)	Data  0.000 ( 0.020)	Loss 2.7141e+00 (2.5591e+00)	Acc@1  41.80 ( 43.71)	Acc@5  64.84 ( 69.04)
Epoch: [9][ 350/5005]	Time  0.693 ( 0.703)	Data  0.000 ( 0.018)	Loss 2.4974e+00 (2.5605e+00)	Acc@1  43.36 ( 43.69)	Acc@5  70.31 ( 68.97)
Epoch: [9][ 400/5005]	Time  0.690 ( 0.702

Epoch: [9][3050/5005]	Time  0.686 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6256e+00 (2.5814e+00)	Acc@1  42.19 ( 43.51)	Acc@5  67.19 ( 68.62)
Epoch: [9][3100/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.4578e+00 (2.5815e+00)	Acc@1  47.27 ( 43.51)	Acc@5  68.36 ( 68.61)
Epoch: [9][3150/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6016e+00 (2.5818e+00)	Acc@1  40.62 ( 43.50)	Acc@5  66.80 ( 68.61)
Epoch: [9][3200/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6468e+00 (2.5815e+00)	Acc@1  44.14 ( 43.51)	Acc@5  68.75 ( 68.61)
Epoch: [9][3250/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.8235e+00 (2.5816e+00)	Acc@1  36.72 ( 43.50)	Acc@5  67.97 ( 68.62)
Epoch: [9][3300/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4144e+00 (2.5816e+00)	Acc@1  46.09 ( 43.50)	Acc@5  73.05 ( 68.62)
Epoch: [9][3350/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.7159e+00 (2.5816e+00)	Acc@1  43.75 ( 43.50)	Acc@5  67.58 ( 68.62)
Epoch: [9][3400/5005]	Time  0.682 ( 0.689



Epoch: [9][4050/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.7399e+00 (2.5838e+00)	Acc@1  39.84 ( 43.47)	Acc@5  67.58 ( 68.58)
Epoch: [9][4100/5005]	Time  0.680 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4457e+00 (2.5839e+00)	Acc@1  44.53 ( 43.47)	Acc@5  69.14 ( 68.58)
Epoch: [9][4150/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6285e+00 (2.5842e+00)	Acc@1  42.19 ( 43.46)	Acc@5  66.41 ( 68.58)
Epoch: [9][4200/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5643e+00 (2.5845e+00)	Acc@1  44.14 ( 43.47)	Acc@5  66.80 ( 68.57)
Epoch: [9][4250/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6388e+00 (2.5847e+00)	Acc@1  41.41 ( 43.46)	Acc@5  66.41 ( 68.57)
Epoch: [9][4300/5005]	Time  0.684 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.3519e+00 (2.5848e+00)	Acc@1  50.00 ( 43.46)	Acc@5  72.27 ( 68.57)
Epoch: [9][4350/5005]	Time  0.684 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5878e+00 (2.5850e+00)	Acc@1  43.36 ( 43.46)	Acc@5  68.75 ( 68.57)
Epoch: [9][4400/5005]	Time  0.686 ( 0.689

Epoch: [10][1800/5005]	Time  0.688 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.4658e+00 (2.5586e+00)	Acc@1  42.97 ( 43.99)	Acc@5  69.92 ( 68.93)
Epoch: [10][1850/5005]	Time  0.684 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.4407e+00 (2.5587e+00)	Acc@1  47.27 ( 43.98)	Acc@5  69.92 ( 68.93)
Epoch: [10][1900/5005]	Time  0.688 ( 0.695)	Data  0.000 ( 0.011)	Loss 2.4133e+00 (2.5593e+00)	Acc@1  42.58 ( 43.97)	Acc@5  72.27 ( 68.93)
Epoch: [10][1950/5005]	Time  0.684 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.2722e+00 (2.5586e+00)	Acc@1  48.44 ( 43.97)	Acc@5  72.27 ( 68.93)
Epoch: [10][2000/5005]	Time  0.681 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.7171e+00 (2.5592e+00)	Acc@1  40.62 ( 43.97)	Acc@5  65.23 ( 68.93)




Epoch: [10][2050/5005]	Time  0.683 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.5187e+00 (2.5583e+00)	Acc@1  44.53 ( 43.98)	Acc@5  68.75 ( 68.94)
Epoch: [10][2100/5005]	Time  0.684 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.6918e+00 (2.5590e+00)	Acc@1  42.97 ( 43.97)	Acc@5  62.89 ( 68.93)
Epoch: [10][2150/5005]	Time  0.686 ( 0.694)	Data  0.000 ( 0.011)	Loss 2.4607e+00 (2.5592e+00)	Acc@1  44.14 ( 43.96)	Acc@5  71.09 ( 68.94)
Epoch: [10][2200/5005]	Time  0.684 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.5852e+00 (2.5605e+00)	Acc@1  42.97 ( 43.95)	Acc@5  69.92 ( 68.92)
Epoch: [10][2250/5005]	Time  0.685 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.9754e+00 (2.5618e+00)	Acc@1  36.72 ( 43.93)	Acc@5  61.33 ( 68.89)
Epoch: [10][2300/5005]	Time  0.684 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.5405e+00 (2.5619e+00)	Acc@1  46.09 ( 43.93)	Acc@5  69.14 ( 68.89)
Epoch: [10][2350/5005]	Time  0.686 ( 0.693)	Data  0.000 ( 0.011)	Loss 2.1930e+00 (2.5612e+00)	Acc@1  53.12 ( 43.94)	Acc@5  74.61 ( 68.90)
Epoch: [10][2400/5005]	Time  0.686

Test: [  0/196]	Time  3.425 ( 3.425)	Loss 1.7919e+00 (1.7919e+00)	Acc@1  58.20 ( 58.20)	Acc@5  83.59 ( 83.59)
Test: [ 50/196]	Time  0.204 ( 0.344)	Loss 1.9147e+00 (2.0064e+00)	Acc@1  49.61 ( 50.61)	Acc@5  80.47 ( 78.60)
Test: [100/196]	Time  0.204 ( 0.316)	Loss 3.2160e+00 (2.1481e+00)	Acc@1  28.91 ( 48.87)	Acc@5  55.86 ( 76.41)
Test: [150/196]	Time  0.202 ( 0.305)	Loss 2.9843e+00 (2.3144e+00)	Acc@1  37.50 ( 46.80)	Acc@5  66.80 ( 73.50)
 * Acc@1 46.224 Acc@5 72.652
lr: [0.09987025056254083]
Epoch: [11][   0/5005]	Time  3.062 ( 3.062)	Data  2.722 ( 2.722)	Loss 2.4783e+00 (2.4783e+00)	Acc@1  45.31 ( 45.31)	Acc@5  71.09 ( 71.09)
Epoch: [11][  50/5005]	Time  0.681 ( 0.729)	Data  0.000 ( 0.062)	Loss 2.6382e+00 (2.5082e+00)	Acc@1  43.75 ( 45.07)	Acc@5  68.36 ( 69.68)
Epoch: [11][ 100/5005]	Time  0.683 ( 0.707)	Data  0.000 ( 0.036)	Loss 2.5691e+00 (2.5064e+00)	Acc@1  45.31 ( 45.01)	Acc@5  69.92 ( 69.84)
Epoch: [11][ 150/5005]	Time  0.685 ( 0.699)	Data  0.000 ( 0.027)	Loss 2.4822e+00 (2.5006e+0



Epoch: [11][ 800/5005]	Time  0.689 ( 0.687)	Data  0.000 ( 0.013)	Loss 2.6549e+00 (2.5279e+00)	Acc@1  41.80 ( 44.67)	Acc@5  66.41 ( 69.49)
Epoch: [11][ 850/5005]	Time  0.689 ( 0.688)	Data  0.000 ( 0.013)	Loss 2.7443e+00 (2.5280e+00)	Acc@1  37.11 ( 44.67)	Acc@5  68.36 ( 69.47)
Epoch: [11][ 900/5005]	Time  0.700 ( 0.688)	Data  0.000 ( 0.012)	Loss 2.7608e+00 (2.5270e+00)	Acc@1  41.02 ( 44.65)	Acc@5  65.23 ( 69.47)
Epoch: [11][ 950/5005]	Time  0.706 ( 0.689)	Data  0.000 ( 0.012)	Loss 2.3518e+00 (2.5278e+00)	Acc@1  49.22 ( 44.65)	Acc@5  72.66 ( 69.45)
Epoch: [11][1000/5005]	Time  0.719 ( 0.690)	Data  0.000 ( 0.012)	Loss 2.3451e+00 (2.5278e+00)	Acc@1  44.53 ( 44.62)	Acc@5  73.05 ( 69.43)
Epoch: [11][1050/5005]	Time  0.695 ( 0.691)	Data  0.000 ( 0.012)	Loss 2.6172e+00 (2.5295e+00)	Acc@1  42.97 ( 44.58)	Acc@5  72.66 ( 69.38)
Epoch: [11][1100/5005]	Time  0.690 ( 0.691)	Data  0.000 ( 0.012)	Loss 2.4133e+00 (2.5289e+00)	Acc@1  45.70 ( 44.61)	Acc@5  73.83 ( 69.40)
Epoch: [11][1150/5005]	Time  0.688

Epoch: [11][3800/5005]	Time  0.686 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6602e+00 (2.5476e+00)	Acc@1  41.02 ( 44.19)	Acc@5  67.58 ( 69.18)
Epoch: [11][3850/5005]	Time  0.689 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5978e+00 (2.5477e+00)	Acc@1  44.14 ( 44.18)	Acc@5  68.75 ( 69.18)
Epoch: [11][3900/5005]	Time  0.694 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4541e+00 (2.5476e+00)	Acc@1  44.92 ( 44.19)	Acc@5  75.00 ( 69.18)
Epoch: [11][3950/5005]	Time  0.698 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5086e+00 (2.5473e+00)	Acc@1  41.80 ( 44.19)	Acc@5  70.31 ( 69.18)
Epoch: [11][4000/5005]	Time  0.708 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.7735e+00 (2.5474e+00)	Acc@1  40.23 ( 44.19)	Acc@5  65.62 ( 69.18)
Epoch: [11][4050/5005]	Time  0.715 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6085e+00 (2.5476e+00)	Acc@1  44.92 ( 44.19)	Acc@5  68.36 ( 69.17)
Epoch: [11][4100/5005]	Time  0.687 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.6023e+00 (2.5480e+00)	Acc@1  44.53 ( 44.18)	Acc@5  67.58 ( 69.16)
Epoch: [11][4150/5005]	Time  0.693

Epoch: [12][1550/5005]	Time  0.681 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.5662e+00 (2.5242e+00)	Acc@1  41.41 ( 44.54)	Acc@5  69.92 ( 69.56)
Epoch: [12][1600/5005]	Time  0.682 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.3013e+00 (2.5240e+00)	Acc@1  46.88 ( 44.53)	Acc@5  75.00 ( 69.57)
Epoch: [12][1650/5005]	Time  0.684 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.5907e+00 (2.5239e+00)	Acc@1  42.19 ( 44.53)	Acc@5  66.02 ( 69.57)
Epoch: [12][1700/5005]	Time  0.686 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.4592e+00 (2.5243e+00)	Acc@1  44.14 ( 44.54)	Acc@5  70.31 ( 69.56)
Epoch: [12][1750/5005]	Time  0.687 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.5033e+00 (2.5251e+00)	Acc@1  47.27 ( 44.54)	Acc@5  69.53 ( 69.53)
Epoch: [12][1800/5005]	Time  0.689 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.4792e+00 (2.5248e+00)	Acc@1  45.31 ( 44.55)	Acc@5  66.41 ( 69.53)
Epoch: [12][1850/5005]	Time  0.691 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.6676e+00 (2.5257e+00)	Acc@1  44.14 ( 44.53)	Acc@5  66.80 ( 69.51)
Epoch: [12][1900/5005]	Time  0.700



Epoch: [12][3100/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.3738e+00 (2.5305e+00)	Acc@1  46.48 ( 44.46)	Acc@5  70.70 ( 69.42)
Epoch: [12][3150/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.7731e+00 (2.5310e+00)	Acc@1  41.80 ( 44.44)	Acc@5  65.23 ( 69.42)
Epoch: [12][3200/5005]	Time  0.680 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.2845e+00 (2.5306e+00)	Acc@1  46.48 ( 44.46)	Acc@5  74.22 ( 69.42)
Epoch: [12][3250/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5994e+00 (2.5307e+00)	Acc@1  41.41 ( 44.45)	Acc@5  70.31 ( 69.42)
Epoch: [12][3300/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5490e+00 (2.5308e+00)	Acc@1  43.75 ( 44.45)	Acc@5  69.14 ( 69.42)
Epoch: [12][3350/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.3465e+00 (2.5308e+00)	Acc@1  50.39 ( 44.45)	Acc@5  74.22 ( 69.42)
Epoch: [12][3400/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4398e+00 (2.5316e+00)	Acc@1  44.53 ( 44.45)	Acc@5  70.70 ( 69.41)
Epoch: [12][3450/5005]	Time  0.683

Epoch: [13][ 850/5005]	Time  0.684 ( 0.692)	Data  0.000 ( 0.013)	Loss 2.4971e+00 (2.5062e+00)	Acc@1  45.31 ( 44.73)	Acc@5  67.58 ( 69.82)
Epoch: [13][ 900/5005]	Time  0.682 ( 0.691)	Data  0.000 ( 0.013)	Loss 2.1409e+00 (2.5075e+00)	Acc@1  52.73 ( 44.71)	Acc@5  73.44 ( 69.78)
Epoch: [13][ 950/5005]	Time  0.687 ( 0.691)	Data  0.000 ( 0.013)	Loss 2.6554e+00 (2.5078e+00)	Acc@1  44.92 ( 44.70)	Acc@5  67.19 ( 69.77)
Epoch: [13][1000/5005]	Time  0.684 ( 0.691)	Data  0.000 ( 0.012)	Loss 2.3869e+00 (2.5059e+00)	Acc@1  47.27 ( 44.72)	Acc@5  71.88 ( 69.81)
Epoch: [13][1050/5005]	Time  0.688 ( 0.690)	Data  0.000 ( 0.012)	Loss 2.5659e+00 (2.5068e+00)	Acc@1  45.31 ( 44.70)	Acc@5  68.75 ( 69.81)
Epoch: [13][1100/5005]	Time  0.691 ( 0.690)	Data  0.000 ( 0.012)	Loss 2.4120e+00 (2.5092e+00)	Acc@1  46.48 ( 44.67)	Acc@5  71.09 ( 69.76)
Epoch: [13][1150/5005]	Time  0.695 ( 0.690)	Data  0.000 ( 0.012)	Loss 2.5223e+00 (2.5086e+00)	Acc@1  43.75 ( 44.69)	Acc@5  71.09 ( 69.77)
Epoch: [13][1200/5005]	Time  0.704



Epoch: [13][1850/5005]	Time  0.686 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.4519e+00 (2.5159e+00)	Acc@1  43.75 ( 44.60)	Acc@5  73.44 ( 69.64)
Epoch: [13][1900/5005]	Time  0.679 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.1861e+00 (2.5155e+00)	Acc@1  49.61 ( 44.62)	Acc@5  74.22 ( 69.65)
Epoch: [13][1950/5005]	Time  0.684 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.5788e+00 (2.5161e+00)	Acc@1  45.70 ( 44.61)	Acc@5  69.14 ( 69.63)
Epoch: [13][2000/5005]	Time  0.684 ( 0.692)	Data  0.000 ( 0.011)	Loss 2.4032e+00 (2.5156e+00)	Acc@1  46.48 ( 44.61)	Acc@5  69.92 ( 69.64)
Epoch: [13][2050/5005]	Time  0.684 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.4468e+00 (2.5161e+00)	Acc@1  44.92 ( 44.60)	Acc@5  69.14 ( 69.63)
Epoch: [13][2100/5005]	Time  0.688 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.2291e+00 (2.5154e+00)	Acc@1  48.83 ( 44.63)	Acc@5  73.83 ( 69.65)
Epoch: [13][2150/5005]	Time  0.685 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.6088e+00 (2.5169e+00)	Acc@1  42.97 ( 44.60)	Acc@5  69.53 ( 69.63)
Epoch: [13][2200/5005]	Time  0.681

Epoch: [13][4850/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.010)	Loss 3.0372e+00 (2.5266e+00)	Acc@1  37.11 ( 44.51)	Acc@5  60.16 ( 69.50)
Epoch: [13][4900/5005]	Time  0.680 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6245e+00 (2.5272e+00)	Acc@1  42.97 ( 44.50)	Acc@5  69.92 ( 69.49)
Epoch: [13][4950/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6432e+00 (2.5271e+00)	Acc@1  45.70 ( 44.50)	Acc@5  68.36 ( 69.49)
Epoch: [13][5000/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.6221e+00 (2.5268e+00)	Acc@1  39.45 ( 44.51)	Acc@5  69.92 ( 69.50)
Test: [  0/196]	Time  3.380 ( 3.380)	Loss 1.5756e+00 (1.5756e+00)	Acc@1  58.98 ( 58.98)	Acc@5  85.94 ( 85.94)
Test: [ 50/196]	Time  0.200 ( 0.342)	Loss 1.3680e+00 (1.9943e+00)	Acc@1  67.19 ( 50.55)	Acc@5  87.89 ( 79.36)
Test: [100/196]	Time  0.201 ( 0.315)	Loss 2.7386e+00 (2.1006e+00)	Acc@1  39.45 ( 49.66)	Acc@5  68.75 ( 77.57)
Test: [150/196]	Time  0.202 ( 0.305)	Loss 2.6699e+00 (2.2761e+00)	Acc@1  45.70 ( 47.41)	Acc@5  70.70 ( 74.22)
 * Acc@1

Epoch: [14][2600/5005]	Time  0.691 ( 0.684)	Data  0.000 ( 0.010)	Loss 2.4747e+00 (2.5107e+00)	Acc@1  44.53 ( 44.84)	Acc@5  71.48 ( 69.78)
Epoch: [14][2650/5005]	Time  0.698 ( 0.684)	Data  0.000 ( 0.010)	Loss 2.3928e+00 (2.5107e+00)	Acc@1  50.00 ( 44.85)	Acc@5  72.66 ( 69.78)
Epoch: [14][2700/5005]	Time  0.710 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.4629e+00 (2.5116e+00)	Acc@1  47.66 ( 44.84)	Acc@5  70.70 ( 69.76)
Epoch: [14][2750/5005]	Time  0.694 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.4256e+00 (2.5117e+00)	Acc@1  45.31 ( 44.84)	Acc@5  74.22 ( 69.76)
Epoch: [14][2800/5005]	Time  0.688 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.6274e+00 (2.5113e+00)	Acc@1  42.58 ( 44.84)	Acc@5  68.36 ( 69.77)
Epoch: [14][2850/5005]	Time  0.680 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.4650e+00 (2.5113e+00)	Acc@1  43.36 ( 44.84)	Acc@5  71.48 ( 69.77)
Epoch: [14][2900/5005]	Time  0.681 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.3870e+00 (2.5114e+00)	Acc@1  47.27 ( 44.83)	Acc@5  69.92 ( 69.77)
Epoch: [14][2950/5005]	Time  0.683



Epoch: [14][3800/5005]	Time  0.688 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.3139e+00 (2.5151e+00)	Acc@1  48.05 ( 44.75)	Acc@5  71.48 ( 69.71)
Epoch: [14][3850/5005]	Time  0.684 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.4224e+00 (2.5152e+00)	Acc@1  42.19 ( 44.74)	Acc@5  70.31 ( 69.71)
Epoch: [14][3900/5005]	Time  0.679 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.4475e+00 (2.5158e+00)	Acc@1  45.31 ( 44.73)	Acc@5  71.48 ( 69.69)
Epoch: [14][3950/5005]	Time  0.685 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.5986e+00 (2.5156e+00)	Acc@1  43.36 ( 44.73)	Acc@5  71.48 ( 69.69)
Epoch: [14][4000/5005]	Time  0.690 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.7464e+00 (2.5159e+00)	Acc@1  37.50 ( 44.72)	Acc@5  63.28 ( 69.69)
Epoch: [14][4050/5005]	Time  0.684 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.6084e+00 (2.5163e+00)	Acc@1  44.53 ( 44.72)	Acc@5  67.19 ( 69.68)
Epoch: [14][4100/5005]	Time  0.682 ( 0.685)	Data  0.000 ( 0.010)	Loss 2.7267e+00 (2.5162e+00)	Acc@1  43.36 ( 44.72)	Acc@5  67.19 ( 69.69)
Epoch: [14][4150/5005]	Time  0.682



Epoch: [15][ 250/5005]	Time  0.711 ( 0.702)	Data  0.000 ( 0.020)	Loss 2.3607e+00 (2.4731e+00)	Acc@1  44.92 ( 45.39)	Acc@5  71.88 ( 70.28)
Epoch: [15][ 300/5005]	Time  0.692 ( 0.702)	Data  0.000 ( 0.018)	Loss 2.4364e+00 (2.4719e+00)	Acc@1  47.27 ( 45.46)	Acc@5  69.53 ( 70.32)
Epoch: [15][ 350/5005]	Time  0.685 ( 0.700)	Data  0.000 ( 0.017)	Loss 2.3415e+00 (2.4742e+00)	Acc@1  45.31 ( 45.48)	Acc@5  74.22 ( 70.27)
Epoch: [15][ 400/5005]	Time  0.683 ( 0.698)	Data  0.000 ( 0.016)	Loss 2.4682e+00 (2.4714e+00)	Acc@1  47.27 ( 45.53)	Acc@5  69.53 ( 70.37)
Epoch: [15][ 450/5005]	Time  0.684 ( 0.697)	Data  0.000 ( 0.015)	Loss 2.4788e+00 (2.4734e+00)	Acc@1  45.70 ( 45.50)	Acc@5  68.75 ( 70.33)
Epoch: [15][ 500/5005]	Time  0.689 ( 0.696)	Data  0.000 ( 0.015)	Loss 2.4204e+00 (2.4775e+00)	Acc@1  44.53 ( 45.41)	Acc@5  70.70 ( 70.23)
Epoch: [15][ 550/5005]	Time  0.687 ( 0.696)	Data  0.000 ( 0.014)	Loss 2.7027e+00 (2.4788e+00)	Acc@1  41.02 ( 45.36)	Acc@5  65.62 ( 70.15)
Epoch: [15][ 600/5005]	Time  0.695

Epoch: [15][3250/5005]	Time  0.684 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4325e+00 (2.5018e+00)	Acc@1  46.88 ( 44.92)	Acc@5  73.44 ( 69.92)
Epoch: [15][3300/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.4713e+00 (2.5023e+00)	Acc@1  46.09 ( 44.92)	Acc@5  68.75 ( 69.91)
Epoch: [15][3350/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.8018e+00 (2.5019e+00)	Acc@1  38.28 ( 44.92)	Acc@5  65.62 ( 69.92)
Epoch: [15][3400/5005]	Time  0.680 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.3574e+00 (2.5017e+00)	Acc@1  49.22 ( 44.93)	Acc@5  71.09 ( 69.92)
Epoch: [15][3450/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.3915e+00 (2.5015e+00)	Acc@1  47.66 ( 44.94)	Acc@5  72.66 ( 69.92)
Epoch: [15][3500/5005]	Time  0.687 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5262e+00 (2.5012e+00)	Acc@1  45.70 ( 44.95)	Acc@5  68.75 ( 69.92)
Epoch: [15][3550/5005]	Time  0.686 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.5605e+00 (2.5017e+00)	Acc@1  48.05 ( 44.94)	Acc@5  71.48 ( 69.92)
Epoch: [15][3600/5005]	Time  0.693

Epoch: [16][1000/5005]	Time  0.679 ( 0.686)	Data  0.000 ( 0.012)	Loss 2.5885e+00 (2.4855e+00)	Acc@1  47.66 ( 45.25)	Acc@5  70.31 ( 70.23)
Epoch: [16][1050/5005]	Time  0.691 ( 0.686)	Data  0.000 ( 0.012)	Loss 2.6782e+00 (2.4860e+00)	Acc@1  44.14 ( 45.24)	Acc@5  64.84 ( 70.22)
Epoch: [16][1100/5005]	Time  0.690 ( 0.686)	Data  0.000 ( 0.012)	Loss 2.6066e+00 (2.4859e+00)	Acc@1  42.19 ( 45.27)	Acc@5  67.19 ( 70.22)
Epoch: [16][1150/5005]	Time  0.692 ( 0.686)	Data  0.000 ( 0.012)	Loss 2.4172e+00 (2.4868e+00)	Acc@1  46.48 ( 45.26)	Acc@5  70.70 ( 70.20)




Epoch: [16][1200/5005]	Time  0.701 ( 0.686)	Data  0.000 ( 0.012)	Loss 2.2704e+00 (2.4863e+00)	Acc@1  49.61 ( 45.28)	Acc@5  75.00 ( 70.22)
Epoch: [16][1250/5005]	Time  0.708 ( 0.687)	Data  0.000 ( 0.012)	Loss 2.2014e+00 (2.4855e+00)	Acc@1  50.78 ( 45.27)	Acc@5  74.61 ( 70.21)
Epoch: [16][1300/5005]	Time  0.699 ( 0.688)	Data  0.000 ( 0.012)	Loss 2.2520e+00 (2.4851e+00)	Acc@1  49.61 ( 45.27)	Acc@5  76.56 ( 70.23)
Epoch: [16][1350/5005]	Time  0.689 ( 0.688)	Data  0.000 ( 0.012)	Loss 2.7807e+00 (2.4860e+00)	Acc@1  39.84 ( 45.24)	Acc@5  62.50 ( 70.21)
Epoch: [16][1400/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.012)	Loss 2.5305e+00 (2.4865e+00)	Acc@1  43.75 ( 45.24)	Acc@5  69.92 ( 70.20)
Epoch: [16][1450/5005]	Time  0.686 ( 0.688)	Data  0.000 ( 0.012)	Loss 2.3592e+00 (2.4871e+00)	Acc@1  46.48 ( 45.25)	Acc@5  72.27 ( 70.18)
Epoch: [16][1500/5005]	Time  0.690 ( 0.688)	Data  0.000 ( 0.011)	Loss 2.5175e+00 (2.4872e+00)	Acc@1  46.88 ( 45.23)	Acc@5  69.92 ( 70.18)
Epoch: [16][1550/5005]	Time  0.692

Epoch: [16][4200/5005]	Time  0.682 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.4638e+00 (2.4990e+00)	Acc@1  43.75 ( 45.04)	Acc@5  70.70 ( 69.97)
Epoch: [16][4250/5005]	Time  0.681 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.4760e+00 (2.4991e+00)	Acc@1  48.44 ( 45.04)	Acc@5  69.53 ( 69.97)
Epoch: [16][4300/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.3488e+00 (2.4991e+00)	Acc@1  46.48 ( 45.04)	Acc@5  69.92 ( 69.98)
Epoch: [16][4350/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.5265e+00 (2.4992e+00)	Acc@1  42.58 ( 45.03)	Acc@5  69.14 ( 69.98)
Epoch: [16][4400/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.5305e+00 (2.4993e+00)	Acc@1  44.92 ( 45.03)	Acc@5  68.36 ( 69.98)
Epoch: [16][4450/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.6644e+00 (2.4995e+00)	Acc@1  38.67 ( 45.03)	Acc@5  67.97 ( 69.97)
Epoch: [16][4500/5005]	Time  0.682 ( 0.688)	Data  0.000 ( 0.010)	Loss 2.5494e+00 (2.4996e+00)	Acc@1  44.53 ( 45.03)	Acc@5  71.09 ( 69.97)
Epoch: [16][4550/5005]	Time  0.680

Epoch: [17][1950/5005]	Time  0.688 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.2398e+00 (2.0491e+00)	Acc@1  50.78 ( 53.99)	Acc@5  72.66 ( 76.89)
Epoch: [17][2000/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.8610e+00 (2.0475e+00)	Acc@1  58.20 ( 54.03)	Acc@5  78.91 ( 76.91)
Epoch: [17][2050/5005]	Time  0.688 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.9331e+00 (2.0454e+00)	Acc@1  55.08 ( 54.07)	Acc@5  76.95 ( 76.94)
Epoch: [17][2100/5005]	Time  0.691 ( 0.690)	Data  0.000 ( 0.011)	Loss 2.0269e+00 (2.0440e+00)	Acc@1  56.25 ( 54.09)	Acc@5  78.52 ( 76.96)
Epoch: [17][2150/5005]	Time  0.695 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.8768e+00 (2.0425e+00)	Acc@1  57.81 ( 54.12)	Acc@5  80.47 ( 76.98)
Epoch: [17][2200/5005]	Time  0.698 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.0009e+00 (2.0406e+00)	Acc@1  55.86 ( 54.16)	Acc@5  75.78 ( 77.02)
Epoch: [17][2250/5005]	Time  0.708 ( 0.691)	Data  0.000 ( 0.011)	Loss 2.0813e+00 (2.0394e+00)	Acc@1  50.39 ( 54.18)	Acc@5  75.00 ( 77.04)
Epoch: [17][2300/5005]	Time  0.696



Epoch: [17][4550/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7790e+00 (1.9834e+00)	Acc@1  60.94 ( 55.23)	Acc@5  78.12 ( 77.86)
Epoch: [17][4600/5005]	Time  0.687 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7456e+00 (1.9827e+00)	Acc@1  59.77 ( 55.24)	Acc@5  82.42 ( 77.88)
Epoch: [17][4650/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.8997e+00 (1.9819e+00)	Acc@1  60.94 ( 55.26)	Acc@5  77.34 ( 77.88)
Epoch: [17][4700/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.010)	Loss 2.0142e+00 (1.9811e+00)	Acc@1  54.30 ( 55.27)	Acc@5  78.12 ( 77.90)
Epoch: [17][4750/5005]	Time  0.678 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.8462e+00 (1.9804e+00)	Acc@1  59.38 ( 55.28)	Acc@5  78.12 ( 77.91)
Epoch: [17][4800/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.8280e+00 (1.9795e+00)	Acc@1  57.03 ( 55.30)	Acc@5  77.73 ( 77.92)
Epoch: [17][4850/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7234e+00 (1.9783e+00)	Acc@1  60.94 ( 55.33)	Acc@5  82.03 ( 77.94)
Epoch: [17][4900/5005]	Time  0.685

Epoch: [18][2300/5005]	Time  0.685 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.8924e+00 (1.8660e+00)	Acc@1  56.64 ( 57.52)	Acc@5  78.52 ( 79.69)
Epoch: [18][2350/5005]	Time  0.686 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.9005e+00 (1.8660e+00)	Acc@1  54.30 ( 57.51)	Acc@5  75.78 ( 79.69)
Epoch: [18][2400/5005]	Time  0.685 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.7106e+00 (1.8661e+00)	Acc@1  60.55 ( 57.51)	Acc@5  82.81 ( 79.69)
Epoch: [18][2450/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.0223e+00 (1.8662e+00)	Acc@1  57.42 ( 57.51)	Acc@5  76.17 ( 79.69)
Epoch: [18][2500/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.8126e+00 (1.8666e+00)	Acc@1  53.52 ( 57.50)	Acc@5  79.69 ( 79.68)
Epoch: [18][2550/5005]	Time  0.682 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.6035e+00 (1.8658e+00)	Acc@1  59.77 ( 57.51)	Acc@5  85.16 ( 79.69)
Epoch: [18][2600/5005]	Time  0.683 ( 0.686)	Data  0.000 ( 0.010)	Loss 2.1399e+00 (1.8657e+00)	Acc@1  56.25 ( 57.52)	Acc@5  75.39 ( 79.70)
Epoch: [18][2650/5005]	Time  0.683



Epoch: [18][4850/5005]	Time  0.695 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.8924e+00 (1.8581e+00)	Acc@1  55.86 ( 57.66)	Acc@5  78.12 ( 79.78)
Epoch: [18][4900/5005]	Time  0.689 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.8670e+00 (1.8576e+00)	Acc@1  59.38 ( 57.67)	Acc@5  80.08 ( 79.80)
Epoch: [18][4950/5005]	Time  0.695 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.7613e+00 (1.8574e+00)	Acc@1  59.38 ( 57.68)	Acc@5  80.08 ( 79.80)
Epoch: [18][5000/5005]	Time  0.704 ( 0.686)	Data  0.000 ( 0.010)	Loss 1.7845e+00 (1.8572e+00)	Acc@1  57.81 ( 57.68)	Acc@5  80.08 ( 79.80)
Test: [  0/196]	Time  3.320 ( 3.320)	Loss 9.4870e-01 (9.4870e-01)	Acc@1  77.34 ( 77.34)	Acc@5  94.14 ( 94.14)
Test: [ 50/196]	Time  0.210 ( 0.343)	Loss 9.6845e-01 (1.1850e+00)	Acc@1  72.66 ( 68.99)	Acc@5  94.53 ( 90.17)
Test: [100/196]	Time  0.209 ( 0.313)	Loss 2.1701e+00 (1.3425e+00)	Acc@1  42.97 ( 65.89)	Acc@5  74.22 ( 88.12)
Test: [150/196]	Time  0.210 ( 0.301)	Loss 1.7569e+00 (1.5115e+00)	Acc@1  63.28 ( 62.96)	Acc@5  78.91 ( 85.32)
 * Acc@1

Epoch: [19][2600/5005]	Time  0.701 ( 0.688)	Data  0.000 ( 0.011)	Loss 1.7283e+00 (1.8087e+00)	Acc@1  57.03 ( 58.64)	Acc@5  84.38 ( 80.41)
Epoch: [19][2650/5005]	Time  0.692 ( 0.688)	Data  0.000 ( 0.011)	Loss 1.8159e+00 (1.8085e+00)	Acc@1  58.20 ( 58.64)	Acc@5  81.64 ( 80.42)
Epoch: [19][2700/5005]	Time  0.690 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8251e+00 (1.8085e+00)	Acc@1  59.38 ( 58.64)	Acc@5  80.47 ( 80.42)
Epoch: [19][2750/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7851e+00 (1.8088e+00)	Acc@1  62.11 ( 58.64)	Acc@5  81.64 ( 80.42)
Epoch: [19][2800/5005]	Time  0.688 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7955e+00 (1.8079e+00)	Acc@1  59.77 ( 58.65)	Acc@5  81.25 ( 80.43)
Epoch: [19][2850/5005]	Time  0.691 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.9431e+00 (1.8083e+00)	Acc@1  55.47 ( 58.64)	Acc@5  76.95 ( 80.42)
Epoch: [19][2900/5005]	Time  0.687 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7816e+00 (1.8082e+00)	Acc@1  62.11 ( 58.65)	Acc@5  79.69 ( 80.42)
Epoch: [19][2950/5005]	Time  0.702



Epoch: [19][3650/5005]	Time  0.681 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8769e+00 (1.8086e+00)	Acc@1  54.30 ( 58.62)	Acc@5  80.08 ( 80.40)
Epoch: [19][3700/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.6974e+00 (1.8082e+00)	Acc@1  61.33 ( 58.63)	Acc@5  78.91 ( 80.40)
Epoch: [19][3750/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.9258e+00 (1.8080e+00)	Acc@1  57.03 ( 58.64)	Acc@5  76.95 ( 80.40)
Epoch: [19][3800/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.9170e+00 (1.8084e+00)	Acc@1  58.20 ( 58.63)	Acc@5  76.17 ( 80.39)
Epoch: [19][3850/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.9499e+00 (1.8080e+00)	Acc@1  57.03 ( 58.63)	Acc@5  76.17 ( 80.40)
Epoch: [19][3900/5005]	Time  0.687 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8357e+00 (1.8081e+00)	Acc@1  62.50 ( 58.62)	Acc@5  80.08 ( 80.40)
Epoch: [19][3950/5005]	Time  0.686 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8395e+00 (1.8083e+00)	Acc@1  57.81 ( 58.62)	Acc@5  78.91 ( 80.40)
Epoch: [19][4000/5005]	Time  0.680

Epoch: [20][1400/5005]	Time  0.679 ( 0.688)	Data  0.000 ( 0.011)	Loss 1.8077e+00 (1.7724e+00)	Acc@1  57.42 ( 59.27)	Acc@5  81.25 ( 80.99)
Epoch: [20][1450/5005]	Time  0.679 ( 0.688)	Data  0.000 ( 0.011)	Loss 1.8296e+00 (1.7728e+00)	Acc@1  56.25 ( 59.26)	Acc@5  78.12 ( 80.97)
Epoch: [20][1500/5005]	Time  0.682 ( 0.688)	Data  0.000 ( 0.011)	Loss 1.6327e+00 (1.7722e+00)	Acc@1  62.11 ( 59.28)	Acc@5  84.38 ( 80.97)
Epoch: [20][1550/5005]	Time  0.683 ( 0.687)	Data  0.000 ( 0.011)	Loss 1.8732e+00 (1.7727e+00)	Acc@1  59.77 ( 59.27)	Acc@5  80.47 ( 80.97)
Epoch: [20][1600/5005]	Time  0.686 ( 0.687)	Data  0.000 ( 0.011)	Loss 1.8727e+00 (1.7740e+00)	Acc@1  60.55 ( 59.23)	Acc@5  78.52 ( 80.94)
Epoch: [20][1650/5005]	Time  0.683 ( 0.687)	Data  0.000 ( 0.011)	Loss 1.7933e+00 (1.7747e+00)	Acc@1  60.55 ( 59.23)	Acc@5  81.64 ( 80.94)
Epoch: [20][1700/5005]	Time  0.685 ( 0.687)	Data  0.000 ( 0.011)	Loss 1.8476e+00 (1.7752e+00)	Acc@1  56.64 ( 59.21)	Acc@5  80.08 ( 80.93)
Epoch: [20][1750/5005]	Time  0.682



Epoch: [20][2000/5005]	Time  0.681 ( 0.686)	Data  0.000 ( 0.011)	Loss 1.8078e+00 (1.7772e+00)	Acc@1  59.38 ( 59.20)	Acc@5  82.81 ( 80.90)
Epoch: [20][2050/5005]	Time  0.692 ( 0.686)	Data  0.000 ( 0.011)	Loss 1.9978e+00 (1.7772e+00)	Acc@1  57.42 ( 59.20)	Acc@5  76.56 ( 80.91)
Epoch: [20][2100/5005]	Time  0.689 ( 0.686)	Data  0.000 ( 0.011)	Loss 1.8611e+00 (1.7777e+00)	Acc@1  51.95 ( 59.18)	Acc@5  80.86 ( 80.91)
Epoch: [20][2150/5005]	Time  0.689 ( 0.687)	Data  0.000 ( 0.011)	Loss 1.5804e+00 (1.7781e+00)	Acc@1  63.28 ( 59.17)	Acc@5  83.98 ( 80.90)
Epoch: [20][2200/5005]	Time  0.697 ( 0.687)	Data  0.000 ( 0.011)	Loss 1.7390e+00 (1.7786e+00)	Acc@1  60.94 ( 59.18)	Acc@5  79.30 ( 80.89)
Epoch: [20][2250/5005]	Time  0.700 ( 0.687)	Data  0.000 ( 0.010)	Loss 1.9289e+00 (1.7783e+00)	Acc@1  55.86 ( 59.18)	Acc@5  79.30 ( 80.90)
Epoch: [20][2300/5005]	Time  0.711 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8134e+00 (1.7788e+00)	Acc@1  58.98 ( 59.17)	Acc@5  82.03 ( 80.89)
Epoch: [20][2350/5005]	Time  0.691

Epoch: [20][5000/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.5804e+00 (1.7787e+00)	Acc@1  62.50 ( 59.15)	Acc@5  84.38 ( 80.87)
Test: [  0/196]	Time  3.326 ( 3.326)	Loss 9.3046e-01 (9.3046e-01)	Acc@1  76.17 ( 76.17)	Acc@5  94.14 ( 94.14)
Test: [ 50/196]	Time  0.227 ( 0.340)	Loss 9.6849e-01 (1.1654e+00)	Acc@1  69.92 ( 69.58)	Acc@5  92.58 ( 90.42)
Test: [100/196]	Time  0.203 ( 0.314)	Loss 2.2442e+00 (1.3239e+00)	Acc@1  42.19 ( 66.33)	Acc@5  75.78 ( 88.27)
Test: [150/196]	Time  0.203 ( 0.304)	Loss 1.7477e+00 (1.4830e+00)	Acc@1  66.80 ( 63.55)	Acc@5  78.91 ( 85.73)
 * Acc@1 62.774 Acc@5 85.038
lr: [0.00997452068955415]
Epoch: [21][   0/5005]	Time  3.388 ( 3.388)	Data  3.095 ( 3.095)	Loss 1.6073e+00 (1.6073e+00)	Acc@1  62.50 ( 62.50)	Acc@5  83.20 ( 83.20)
Epoch: [21][  50/5005]	Time  0.686 ( 0.739)	Data  0.000 ( 0.070)	Loss 1.9005e+00 (1.7265e+00)	Acc@1  58.20 ( 60.22)	Acc@5  83.20 ( 81.63)
Epoch: [21][ 100/5005]	Time  0.692 ( 0.715)	Data  0.000 ( 0.040)	Loss 1.8107e+00 (1.7315e+0

Epoch: [21][2750/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.011)	Loss 2.1184e+00 (1.7548e+00)	Acc@1  51.95 ( 59.64)	Acc@5  75.78 ( 81.18)
Epoch: [21][2800/5005]	Time  0.683 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.7759e+00 (1.7546e+00)	Acc@1  57.81 ( 59.64)	Acc@5  80.47 ( 81.19)
Epoch: [21][2850/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.6239e+00 (1.7549e+00)	Acc@1  63.28 ( 59.64)	Acc@5  83.20 ( 81.18)
Epoch: [21][2900/5005]	Time  0.686 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.6825e+00 (1.7550e+00)	Acc@1  61.72 ( 59.63)	Acc@5  80.86 ( 81.18)
Epoch: [21][2950/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.7434e+00 (1.7553e+00)	Acc@1  58.20 ( 59.62)	Acc@5  81.64 ( 81.17)
Epoch: [21][3000/5005]	Time  0.689 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.7106e+00 (1.7549e+00)	Acc@1  63.28 ( 59.63)	Acc@5  81.64 ( 81.17)
Epoch: [21][3050/5005]	Time  0.689 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.8406e+00 (1.7557e+00)	Acc@1  60.16 ( 59.62)	Acc@5  81.25 ( 81.16)
Epoch: [21][3100/5005]	Time  0.689



Epoch: [21][4450/5005]	Time  0.686 ( 0.692)	Data  0.000 ( 0.010)	Loss 1.6370e+00 (1.7563e+00)	Acc@1  61.33 ( 59.60)	Acc@5  81.64 ( 81.20)
Epoch: [21][4500/5005]	Time  0.687 ( 0.691)	Data  0.000 ( 0.010)	Loss 2.0172e+00 (1.7566e+00)	Acc@1  55.86 ( 59.59)	Acc@5  75.00 ( 81.20)
Epoch: [21][4550/5005]	Time  0.689 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.8347e+00 (1.7569e+00)	Acc@1  57.81 ( 59.59)	Acc@5  80.86 ( 81.20)
Epoch: [21][4600/5005]	Time  0.690 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.8294e+00 (1.7571e+00)	Acc@1  56.25 ( 59.59)	Acc@5  82.81 ( 81.19)
Epoch: [21][4650/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.6909e+00 (1.7572e+00)	Acc@1  60.55 ( 59.58)	Acc@5  82.03 ( 81.19)
Epoch: [21][4700/5005]	Time  0.682 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.9560e+00 (1.7571e+00)	Acc@1  56.25 ( 59.58)	Acc@5  80.08 ( 81.19)
Epoch: [21][4750/5005]	Time  0.683 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.6187e+00 (1.7574e+00)	Acc@1  62.50 ( 59.58)	Acc@5  82.81 ( 81.18)
Epoch: [21][4800/5005]	Time  0.685

Epoch: [22][2200/5005]	Time  0.684 ( 0.693)	Data  0.000 ( 0.011)	Loss 1.6396e+00 (1.7389e+00)	Acc@1  62.11 ( 59.89)	Acc@5  83.20 ( 81.46)
Epoch: [22][2250/5005]	Time  0.690 ( 0.693)	Data  0.000 ( 0.011)	Loss 1.8677e+00 (1.7390e+00)	Acc@1  58.20 ( 59.90)	Acc@5  78.52 ( 81.46)
Epoch: [22][2300/5005]	Time  0.688 ( 0.693)	Data  0.000 ( 0.011)	Loss 1.8215e+00 (1.7393e+00)	Acc@1  56.25 ( 59.90)	Acc@5  82.03 ( 81.45)
Epoch: [22][2350/5005]	Time  0.690 ( 0.693)	Data  0.000 ( 0.011)	Loss 1.8752e+00 (1.7394e+00)	Acc@1  51.95 ( 59.88)	Acc@5  78.91 ( 81.45)
Epoch: [22][2400/5005]	Time  0.683 ( 0.693)	Data  0.000 ( 0.011)	Loss 1.7125e+00 (1.7397e+00)	Acc@1  62.89 ( 59.88)	Acc@5  79.69 ( 81.45)
Epoch: [22][2450/5005]	Time  0.685 ( 0.692)	Data  0.000 ( 0.011)	Loss 1.6235e+00 (1.7394e+00)	Acc@1  61.33 ( 59.89)	Acc@5  82.81 ( 81.46)
Epoch: [22][2500/5005]	Time  0.686 ( 0.692)	Data  0.000 ( 0.011)	Loss 1.5489e+00 (1.7389e+00)	Acc@1  64.06 ( 59.90)	Acc@5  85.94 ( 81.47)
Epoch: [22][2550/5005]	Time  0.683



Epoch: [22][2850/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.6238e+00 (1.7412e+00)	Acc@1  62.50 ( 59.86)	Acc@5  84.38 ( 81.43)
Epoch: [22][2900/5005]	Time  0.683 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.7842e+00 (1.7412e+00)	Acc@1  57.81 ( 59.86)	Acc@5  78.91 ( 81.42)
Epoch: [22][2950/5005]	Time  0.685 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.6053e+00 (1.7413e+00)	Acc@1  60.94 ( 59.86)	Acc@5  85.16 ( 81.42)
Epoch: [22][3000/5005]	Time  0.687 ( 0.691)	Data  0.000 ( 0.010)	Loss 2.0003e+00 (1.7413e+00)	Acc@1  55.08 ( 59.86)	Acc@5  80.08 ( 81.42)
Epoch: [22][3050/5005]	Time  0.685 ( 0.691)	Data  0.000 ( 0.010)	Loss 2.0742e+00 (1.7419e+00)	Acc@1  53.12 ( 59.85)	Acc@5  75.78 ( 81.41)
Epoch: [22][3100/5005]	Time  0.684 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.7531e+00 (1.7418e+00)	Acc@1  59.38 ( 59.86)	Acc@5  80.86 ( 81.41)
Epoch: [22][3150/5005]	Time  0.688 ( 0.691)	Data  0.000 ( 0.010)	Loss 1.8082e+00 (1.7423e+00)	Acc@1  54.30 ( 59.85)	Acc@5  82.81 ( 81.41)
Epoch: [22][3200/5005]	Time  0.682

Epoch: [23][ 600/5005]	Time  0.689 ( 0.697)	Data  0.000 ( 0.014)	Loss 1.9005e+00 (1.7132e+00)	Acc@1  56.25 ( 60.43)	Acc@5  76.56 ( 81.80)
Epoch: [23][ 650/5005]	Time  0.688 ( 0.697)	Data  0.000 ( 0.013)	Loss 1.5888e+00 (1.7146e+00)	Acc@1  64.06 ( 60.39)	Acc@5  84.38 ( 81.76)
Epoch: [23][ 700/5005]	Time  0.686 ( 0.696)	Data  0.000 ( 0.013)	Loss 1.5534e+00 (1.7156e+00)	Acc@1  61.72 ( 60.42)	Acc@5  84.38 ( 81.77)
Epoch: [23][ 750/5005]	Time  0.687 ( 0.695)	Data  0.000 ( 0.013)	Loss 1.7208e+00 (1.7186e+00)	Acc@1  59.38 ( 60.36)	Acc@5  82.03 ( 81.72)
Epoch: [23][ 800/5005]	Time  0.684 ( 0.695)	Data  0.000 ( 0.013)	Loss 1.5374e+00 (1.7199e+00)	Acc@1  64.84 ( 60.33)	Acc@5  83.59 ( 81.68)
Epoch: [23][ 850/5005]	Time  0.684 ( 0.694)	Data  0.000 ( 0.012)	Loss 1.6445e+00 (1.7207e+00)	Acc@1  61.33 ( 60.28)	Acc@5  84.38 ( 81.66)
Epoch: [23][ 900/5005]	Time  0.682 ( 0.693)	Data  0.000 ( 0.012)	Loss 1.7622e+00 (1.7223e+00)	Acc@1  61.33 ( 60.24)	Acc@5  81.64 ( 81.64)
Epoch: [23][ 950/5005]	Time  0.688

Epoch: [23][3600/5005]	Time  0.681 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8375e+00 (1.7341e+00)	Acc@1  53.91 ( 60.03)	Acc@5  80.08 ( 81.50)
Epoch: [23][3650/5005]	Time  0.688 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8057e+00 (1.7340e+00)	Acc@1  57.81 ( 60.03)	Acc@5  82.42 ( 81.50)
Epoch: [23][3700/5005]	Time  0.684 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7661e+00 (1.7342e+00)	Acc@1  62.50 ( 60.03)	Acc@5  80.47 ( 81.50)
Epoch: [23][3750/5005]	Time  0.688 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7880e+00 (1.7341e+00)	Acc@1  60.55 ( 60.03)	Acc@5  78.91 ( 81.50)
Epoch: [23][3800/5005]	Time  0.679 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7203e+00 (1.7343e+00)	Acc@1  64.06 ( 60.02)	Acc@5  81.64 ( 81.50)
Epoch: [23][3850/5005]	Time  0.682 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7848e+00 (1.7343e+00)	Acc@1  54.69 ( 60.02)	Acc@5  82.42 ( 81.50)
Epoch: [23][3900/5005]	Time  0.688 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8439e+00 (1.7345e+00)	Acc@1  53.91 ( 60.01)	Acc@5  81.64 ( 81.49)




Epoch: [23][3950/5005]	Time  0.680 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.6127e+00 (1.7348e+00)	Acc@1  64.06 ( 60.01)	Acc@5  82.03 ( 81.49)
Epoch: [23][4000/5005]	Time  0.688 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8400e+00 (1.7349e+00)	Acc@1  60.55 ( 60.00)	Acc@5  79.69 ( 81.49)
Epoch: [23][4050/5005]	Time  0.681 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.9537e+00 (1.7350e+00)	Acc@1  57.03 ( 60.00)	Acc@5  77.73 ( 81.49)
Epoch: [23][4100/5005]	Time  0.686 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.6970e+00 (1.7350e+00)	Acc@1  60.16 ( 59.99)	Acc@5  82.81 ( 81.50)
Epoch: [23][4150/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.7905e+00 (1.7355e+00)	Acc@1  57.03 ( 59.99)	Acc@5  80.47 ( 81.49)
Epoch: [23][4200/5005]	Time  0.685 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.8154e+00 (1.7356e+00)	Acc@1  60.94 ( 59.98)	Acc@5  80.08 ( 81.48)
Epoch: [23][4250/5005]	Time  0.683 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.6749e+00 (1.7357e+00)	Acc@1  56.64 ( 59.97)	Acc@5  82.42 ( 81.48)
Epoch: [23][4300/5005]	Time  0.681

Epoch: [24][1700/5005]	Time  0.680 ( 0.692)	Data  0.000 ( 0.011)	Loss 1.6650e+00 (1.7150e+00)	Acc@1  60.55 ( 60.33)	Acc@5  85.55 ( 81.81)
Epoch: [24][1750/5005]	Time  0.688 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.8588e+00 (1.7166e+00)	Acc@1  57.03 ( 60.31)	Acc@5  77.34 ( 81.78)
Epoch: [24][1800/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.5604e+00 (1.7170e+00)	Acc@1  63.67 ( 60.30)	Acc@5  84.77 ( 81.77)
Epoch: [24][1850/5005]	Time  0.691 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.8067e+00 (1.7177e+00)	Acc@1  60.55 ( 60.29)	Acc@5  80.47 ( 81.77)
Epoch: [24][1900/5005]	Time  0.686 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.8100e+00 (1.7182e+00)	Acc@1  60.55 ( 60.27)	Acc@5  78.12 ( 81.76)
Epoch: [24][1950/5005]	Time  0.687 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.8575e+00 (1.7189e+00)	Acc@1  58.98 ( 60.27)	Acc@5  80.47 ( 81.74)
Epoch: [24][2000/5005]	Time  0.682 ( 0.691)	Data  0.000 ( 0.011)	Loss 1.7669e+00 (1.7199e+00)	Acc@1  63.28 ( 60.27)	Acc@5  82.81 ( 81.73)
Epoch: [24][2050/5005]	Time  0.685



Epoch: [24][2100/5005]	Time  0.688 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.5952e+00 (1.7202e+00)	Acc@1  64.06 ( 60.26)	Acc@5  82.03 ( 81.73)
Epoch: [24][2150/5005]	Time  0.685 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.7321e+00 (1.7205e+00)	Acc@1  59.77 ( 60.26)	Acc@5  81.25 ( 81.72)
Epoch: [24][2200/5005]	Time  0.685 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.6209e+00 (1.7207e+00)	Acc@1  64.06 ( 60.26)	Acc@5  82.42 ( 81.72)
Epoch: [24][2250/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.4531e+00 (1.7211e+00)	Acc@1  66.80 ( 60.25)	Acc@5  85.94 ( 81.71)
Epoch: [24][2300/5005]	Time  0.683 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.6193e+00 (1.7219e+00)	Acc@1  60.94 ( 60.25)	Acc@5  81.25 ( 81.69)
Epoch: [24][2350/5005]	Time  0.682 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.6880e+00 (1.7223e+00)	Acc@1  60.16 ( 60.24)	Acc@5  82.42 ( 81.69)
Epoch: [24][2400/5005]	Time  0.686 ( 0.690)	Data  0.000 ( 0.011)	Loss 1.7576e+00 (1.7221e+00)	Acc@1  62.11 ( 60.24)	Acc@5  81.64 ( 81.69)
Epoch: [24][2450/5005]	Time  0.682

Test: [ 50/196]	Time  0.203 ( 0.341)	Loss 8.5326e-01 (1.1532e+00)	Acc@1  75.78 ( 69.86)	Acc@5  94.14 ( 90.79)
Test: [100/196]	Time  0.202 ( 0.313)	Loss 2.0199e+00 (1.3056e+00)	Acc@1  51.56 ( 66.96)	Acc@5  76.17 ( 88.77)
Test: [150/196]	Time  0.204 ( 0.302)	Loss 1.8001e+00 (1.4612e+00)	Acc@1  65.62 ( 64.23)	Acc@5  79.30 ( 86.22)
 * Acc@1 63.284 Acc@5 85.424
lr: [0.009969442298524795]
Epoch: [25][   0/5005]	Time  3.010 ( 3.010)	Data  2.689 ( 2.689)	Loss 1.5933e+00 (1.5933e+00)	Acc@1  62.89 ( 62.89)	Acc@5  84.38 ( 84.38)
Epoch: [25][  50/5005]	Time  0.685 ( 0.727)	Data  0.000 ( 0.061)	Loss 1.6438e+00 (1.7144e+00)	Acc@1  63.28 ( 60.54)	Acc@5  80.86 ( 81.97)
Epoch: [25][ 100/5005]	Time  0.681 ( 0.705)	Data  0.000 ( 0.036)	Loss 2.0235e+00 (1.7268e+00)	Acc@1  54.30 ( 60.11)	Acc@5  77.34 ( 81.79)
Epoch: [25][ 150/5005]	Time  0.683 ( 0.698)	Data  0.000 ( 0.027)	Loss 1.8527e+00 (1.7283e+00)	Acc@1  60.55 ( 60.07)	Acc@5  79.69 ( 81.73)
Epoch: [25][ 200/5005]	Time  0.686 ( 0.695)	Data  0.000 ( 0.02

Epoch: [25][2850/5005]	Time  0.694 ( 0.688)	Data  0.000 ( 0.010)	Loss 1.9806e+00 (1.7168e+00)	Acc@1  54.30 ( 60.41)	Acc@5  78.12 ( 81.78)
Epoch: [25][2900/5005]	Time  0.702 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7660e+00 (1.7170e+00)	Acc@1  57.42 ( 60.41)	Acc@5  82.42 ( 81.79)
Epoch: [25][2950/5005]	Time  0.711 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.9375e+00 (1.7165e+00)	Acc@1  55.86 ( 60.41)	Acc@5  74.61 ( 81.79)
Epoch: [25][3000/5005]	Time  0.701 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.6550e+00 (1.7165e+00)	Acc@1  63.67 ( 60.42)	Acc@5  82.81 ( 81.79)
Epoch: [25][3050/5005]	Time  0.690 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7072e+00 (1.7167e+00)	Acc@1  60.16 ( 60.42)	Acc@5  80.86 ( 81.79)
Epoch: [25][3100/5005]	Time  0.691 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.6195e+00 (1.7173e+00)	Acc@1  59.38 ( 60.40)	Acc@5  83.98 ( 81.78)
Epoch: [25][3150/5005]	Time  0.693 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.5737e+00 (1.7181e+00)	Acc@1  62.11 ( 60.39)	Acc@5  84.38 ( 81.76)
Epoch: [25][3200/5005]	Time  0.691



Epoch: [25][3650/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.7700e+00 (1.7205e+00)	Acc@1  58.20 ( 60.34)	Acc@5  81.25 ( 81.72)
Epoch: [25][3700/5005]	Time  0.685 ( 0.690)	Data  0.000 ( 0.010)	Loss 2.0010e+00 (1.7208e+00)	Acc@1  57.03 ( 60.34)	Acc@5  75.39 ( 81.71)
Epoch: [25][3750/5005]	Time  0.686 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.7966e+00 (1.7215e+00)	Acc@1  61.33 ( 60.33)	Acc@5  80.08 ( 81.70)
Epoch: [25][3800/5005]	Time  0.688 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.9220e+00 (1.7219e+00)	Acc@1  59.38 ( 60.32)	Acc@5  80.86 ( 81.70)
Epoch: [25][3850/5005]	Time  0.684 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.6588e+00 (1.7221e+00)	Acc@1  60.55 ( 60.32)	Acc@5  83.98 ( 81.69)
Epoch: [25][3900/5005]	Time  0.683 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.5519e+00 (1.7221e+00)	Acc@1  64.45 ( 60.32)	Acc@5  82.03 ( 81.70)
Epoch: [25][3950/5005]	Time  0.688 ( 0.690)	Data  0.000 ( 0.010)	Loss 1.7105e+00 (1.7223e+00)	Acc@1  61.72 ( 60.31)	Acc@5  82.03 ( 81.70)
Epoch: [25][4000/5005]	Time  0.682

Epoch: [26][1400/5005]	Time  0.679 ( 0.690)	Data  0.000 ( 0.011)	Loss 2.0200e+00 (1.7054e+00)	Acc@1  55.86 ( 60.49)	Acc@5  75.00 ( 81.92)
Epoch: [26][1450/5005]	Time  0.683 ( 0.689)	Data  0.000 ( 0.011)	Loss 1.4989e+00 (1.7051e+00)	Acc@1  68.36 ( 60.50)	Acc@5  85.16 ( 81.92)
Epoch: [26][1500/5005]	Time  0.688 ( 0.689)	Data  0.000 ( 0.011)	Loss 1.6806e+00 (1.7061e+00)	Acc@1  58.20 ( 60.48)	Acc@5  82.81 ( 81.91)
Epoch: [26][1550/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.011)	Loss 1.6482e+00 (1.7057e+00)	Acc@1  62.50 ( 60.48)	Acc@5  82.42 ( 81.91)
Epoch: [26][1600/5005]	Time  0.685 ( 0.689)	Data  0.000 ( 0.011)	Loss 1.8206e+00 (1.7065e+00)	Acc@1  58.20 ( 60.45)	Acc@5  83.59 ( 81.91)
Epoch: [26][1650/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.011)	Loss 1.8282e+00 (1.7065e+00)	Acc@1  59.38 ( 60.44)	Acc@5  80.86 ( 81.91)
Epoch: [26][1700/5005]	Time  0.686 ( 0.689)	Data  0.000 ( 0.011)	Loss 1.8097e+00 (1.7076e+00)	Acc@1  59.77 ( 60.42)	Acc@5  82.42 ( 81.90)
Epoch: [26][1750/5005]	Time  0.682



Epoch: [26][3600/5005]	Time  0.694 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7837e+00 (1.7187e+00)	Acc@1  60.16 ( 60.29)	Acc@5  78.52 ( 81.77)
Epoch: [26][3650/5005]	Time  0.690 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.6367e+00 (1.7192e+00)	Acc@1  62.50 ( 60.28)	Acc@5  82.42 ( 81.77)
Epoch: [26][3700/5005]	Time  0.682 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7052e+00 (1.7196e+00)	Acc@1  63.28 ( 60.27)	Acc@5  78.91 ( 81.76)
Epoch: [26][3750/5005]	Time  0.686 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.7947e+00 (1.7200e+00)	Acc@1  58.98 ( 60.26)	Acc@5  81.25 ( 81.75)
Epoch: [26][3800/5005]	Time  0.684 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.8667e+00 (1.7197e+00)	Acc@1  56.64 ( 60.26)	Acc@5  79.30 ( 81.76)
Epoch: [26][3850/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.6754e+00 (1.7201e+00)	Acc@1  62.11 ( 60.25)	Acc@5  80.86 ( 81.75)
Epoch: [26][3900/5005]	Time  0.681 ( 0.689)	Data  0.000 ( 0.010)	Loss 1.8952e+00 (1.7205e+00)	Acc@1  59.38 ( 60.25)	Acc@5  76.95 ( 81.74)
Epoch: [26][3950/5005]	Time  0.686

KeyboardInterrupt: 