In [1]:
import torch
from torch.utils.data import DataLoader
from dataset.dataset import get_cdiscount_dataset
from model.model import assemble_model
from trainer.trainer import get_trainer

# Ignore warnings
import warnings
warnings.filterwarnings("ignore")

# redirect print to file
# import sys
# sys.stdout = open("PyTorch-resnet34-log.txt", "w")

In [None]:
# Run parameters.
# The whole mapping is handed to get_trainer() further down; the batch sizes
# and 'arch' are additionally read directly when the data loaders and the
# model are built. Key order is kept stable on purpose.
config = dict(
    # mini-batch sizes used for the training / validation DataLoader
    train_batch_size=48,
    val_batch_size=48,
    # name of the torchvision.models constructor to start from
    arch='resnet152',
    # optimisation settings (interpreted by the trainer)
    optimizer='Adam',
    learning_rate=5e-6,
    decay_lr_freq=3e5,
    weight_decay=5e-4,
    # checkpoint to resume from; None here
    resume=None,
    # epoch range
    start_epoch=0,
    epochs=10,
    # how often to log / validate / save (units are defined by the trainer;
    # the training log counts batches -- TODO confirm)
    print_freq=10,
    validate_freq=3e4,
    save_freq=1e3,
    # starting value for the best validation top-1 precision seen so far
    best_val_prec1=0,
)

In [None]:
import torchvision.models as models

# ---------------------------------------------------------------------------
# Build the datasets, data loaders, model and loss, then start training.
# Reads `config` from the parameters cell; requires CUDA (the model and the
# loss are both moved to the GPU).
# ---------------------------------------------------------------------------

# get dataset
print('getting dataset...')
# Both splits are read from the same BSON file with the same offsets table;
# only the per-image index CSV differs. The shared arguments are defined once
# so the two calls cannot drift apart.
dataset_kwargs = dict(
    offsets_csv="train_offsets.csv",
    bson_file_path="/mnt/data/cdiscount/train.bson",
    with_label=True,
    resize=224,
)
train_dataset = get_cdiscount_dataset(images_csv="train_images.csv", **dataset_kwargs)
val_dataset = get_cdiscount_dataset(images_csv="val_images.csv", **dataset_kwargs)

# get data loader
print('getting data loader...')
num_workers = 6
train_dataloader = DataLoader(train_dataset,
                              batch_size=config['train_batch_size'],
                              shuffle=True,
                              num_workers=num_workers)
# NOTE(review): the validation loader is shuffled as well. That is harmless if
# the trainer always walks the full validation set, but makes partial
# validation passes non-repeatable -- confirm whether shuffle=False is wanted.
val_dataloader = DataLoader(val_dataset,
                            batch_size=config['val_batch_size'],
                            shuffle=True,
                            num_workers=num_workers)

# define model
# Resolve the architecture name up front. A plain `models.__dict__[name]`
# lookup raises a bare KeyError on a typo and happily returns submodules or
# classes (e.g. 'resnet', 'ResNet') that then fail with an opaque TypeError
# when called with pretrained=True.
arch = config['arch']
model_factory = getattr(models, arch, None)
if arch.startswith('_') or not arch.islower() or not callable(model_factory):
    available_archs = sorted(
        name for name in dir(models)
        if name.islower() and not name.startswith('_')
        and callable(getattr(models, name))
    )
    raise ValueError("unknown architecture '{}'; expected one of: {}".format(
        arch, ', '.join(available_archs)))

print("=> using pre-trained model '{}'".format(arch))
model = model_factory(pretrained=True)
# NOTE(review): assemble_model is project code that is not visible here. The
# literals -1, 2048 and 5270 are presumably a layer cut-off index, the backbone
# feature width and the number of output classes -- confirm and give them names.
model = assemble_model(model, -1, 2048, 5270)
# Wrap for multi-GPU data parallelism and move the parameters to the GPU.
model = torch.nn.DataParallel(model).cuda()

# define loss function (criterion) and optimizer
# (only the loss is created here; the optimizer is selected via `config`
# and is presumably built inside the trainer -- TODO confirm)
criterion = torch.nn.CrossEntropyLoss().cuda()

# get trainer
# `Trainer` is the object returned by get_trainer(), not a class; the
# capitalised name is kept because other cells may refer to it.
Trainer = get_trainer(train_dataloader, val_dataloader, model, criterion, config)

# Run!
Trainer.run()

getting dataset...
getting data loader...
=> using pre-trained model 'resnet152'
start training
Epoch: [0][0/206270]	Time 23.269 (23.269)	Data 3.325 (3.325)	Loss 8.6347 (8.6347)	Prec@1 0.000 (0.000)	Prec@5 0.000 (0.000)
Epoch: [0][10/206270]	Time 2.559 (4.451)	Data 0.007 (0.310)	Loss 8.6234 (8.6162)	Prec@1 0.000 (0.000)	Prec@5 0.000 (0.000)
Epoch: [0][20/206270]	Time 2.557 (3.543)	Data 0.009 (0.167)	Loss 8.6363 (8.6019)	Prec@1 0.000 (0.000)	Prec@5 2.083 (0.397)
Epoch: [0][30/206270]	Time 2.564 (3.226)	Data 0.009 (0.116)	Loss 8.5990 (8.5756)	Prec@1 0.000 (0.000)	Prec@5 0.000 (0.336)
Epoch: [0][40/206270]	Time 2.549 (3.063)	Data 0.008 (0.090)	Loss 8.4095 (8.5665)	Prec@1 0.000 (0.000)	Prec@5 0.000 (0.254)
Epoch: [0][50/206270]	Time 2.558 (2.963)	Data 0.018 (0.074)	Loss 8.5124 (8.5533)	Prec@1 0.000 (0.000)	Prec@5 4.167 (0.408)
Epoch: [0][60/206270]	Time 2.562 (2.898)	Data 0.008 (0.064)	Loss 8.4454 (8.5297)	Prec@1 0.000 (0.102)	Prec@5 0.000 (0.444)
Epoch: [0][70/206270]	Time 2.546 (2.851)	D

Epoch: [0][650/206270]	Time 2.567 (2.591)	Data 0.008 (0.015)	Loss 6.9431 (7.5943)	Prec@1 10.417 (5.293)	Prec@5 16.667 (11.364)
Epoch: [0][660/206270]	Time 2.549 (2.590)	Data 0.008 (0.015)	Loss 7.1555 (7.5842)	Prec@1 10.417 (5.358)	Prec@5 16.667 (11.485)
Epoch: [0][670/206270]	Time 2.550 (2.590)	Data 0.010 (0.015)	Loss 6.9948 (7.5738)	Prec@1 10.417 (5.437)	Prec@5 18.750 (11.587)
Epoch: [0][680/206270]	Time 2.550 (2.589)	Data 0.008 (0.014)	Loss 7.0365 (7.5648)	Prec@1 18.750 (5.522)	Prec@5 18.750 (11.662)
Epoch: [0][690/206270]	Time 2.556 (2.589)	Data 0.008 (0.014)	Loss 6.9763 (7.5545)	Prec@1 8.333 (5.605)	Prec@5 18.750 (11.798)
Epoch: [0][700/206270]	Time 2.572 (2.588)	Data 0.010 (0.014)	Loss 6.2917 (7.5427)	Prec@1 16.667 (5.712)	Prec@5 27.083 (11.929)
Epoch: [0][710/206270]	Time 2.569 (2.588)	Data 0.008 (0.014)	Loss 6.7297 (7.5311)	Prec@1 10.417 (5.793)	Prec@5 25.000 (12.066)
Epoch: [0][720/206270]	Time 2.557 (2.587)	Data 0.010 (0.014)	Loss 6.7307 (7.5197)	Prec@1 12.500 (5.892)	Prec@5 2

Epoch: [0][1300/206270]	Time 2.555 (2.575)	Data 0.010 (0.013)	Loss 6.3068 (6.9818)	Prec@1 12.500 (9.530)	Prec@5 20.833 (17.943)
Epoch: [0][1310/206270]	Time 2.561 (2.575)	Data 0.009 (0.013)	Loss 5.8264 (6.9739)	Prec@1 18.750 (9.586)	Prec@5 29.167 (18.016)
Epoch: [0][1320/206270]	Time 2.561 (2.575)	Data 0.009 (0.013)	Loss 6.0056 (6.9659)	Prec@1 10.417 (9.645)	Prec@5 27.083 (18.102)
Epoch: [0][1330/206270]	Time 2.565 (2.575)	Data 0.012 (0.013)	Loss 5.6190 (6.9597)	Prec@1 20.833 (9.678)	Prec@5 33.333 (18.160)
Epoch: [0][1340/206270]	Time 2.559 (2.575)	Data 0.009 (0.013)	Loss 5.9369 (6.9524)	Prec@1 20.833 (9.736)	Prec@5 33.333 (18.245)
Epoch: [0][1350/206270]	Time 2.559 (2.575)	Data 0.011 (0.013)	Loss 5.5773 (6.9446)	Prec@1 22.917 (9.806)	Prec@5 35.417 (18.340)
Epoch: [0][1360/206270]	Time 2.557 (2.575)	Data 0.011 (0.013)	Loss 5.6456 (6.9372)	Prec@1 20.833 (9.849)	Prec@5 33.333 (18.410)
Epoch: [0][1370/206270]	Time 2.561 (2.575)	Data 0.010 (0.013)	Loss 6.1700 (6.9315)	Prec@1 16.667 (9.888)

Epoch: [0][1940/206270]	Time 2.550 (2.570)	Data 0.013 (0.013)	Loss 5.8099 (6.5940)	Prec@1 16.667 (12.284)	Prec@5 25.000 (21.866)
Epoch: [0][1950/206270]	Time 2.548 (2.570)	Data 0.010 (0.013)	Loss 5.6311 (6.5885)	Prec@1 14.583 (12.328)	Prec@5 27.083 (21.919)
Epoch: [0][1960/206270]	Time 2.562 (2.570)	Data 0.011 (0.013)	Loss 5.3995 (6.5820)	Prec@1 14.583 (12.385)	Prec@5 35.417 (21.991)
Epoch: [0][1970/206270]	Time 2.553 (2.569)	Data 0.014 (0.013)	Loss 5.4116 (6.5769)	Prec@1 20.833 (12.422)	Prec@5 39.583 (22.052)
Epoch: [0][1980/206270]	Time 2.565 (2.569)	Data 0.011 (0.013)	Loss 5.7652 (6.5723)	Prec@1 12.500 (12.454)	Prec@5 29.167 (22.101)
Epoch: [0][1990/206270]	Time 2.538 (2.569)	Data 0.013 (0.013)	Loss 5.3652 (6.5671)	Prec@1 25.000 (12.487)	Prec@5 37.500 (22.147)
Epoch: [0][2000/206270]	Time 2.553 (2.569)	Data 0.014 (0.013)	Loss 5.5447 (6.5616)	Prec@1 18.750 (12.526)	Prec@5 31.250 (22.192)
Epoch: [0][2010/206270]	Time 2.560 (2.570)	Data 0.012 (0.013)	Loss 6.1841 (6.5567)	Prec@1 14.583 

Epoch: [0][2580/206270]	Time 2.541 (2.567)	Data 0.011 (0.013)	Loss 5.3304 (6.3121)	Prec@1 18.750 (14.659)	Prec@5 35.417 (24.885)
Epoch: [0][2590/206270]	Time 2.548 (2.567)	Data 0.011 (0.013)	Loss 5.4610 (6.3076)	Prec@1 20.833 (14.702)	Prec@5 29.167 (24.944)
Epoch: [0][2600/206270]	Time 2.564 (2.567)	Data 0.016 (0.013)	Loss 5.0832 (6.3037)	Prec@1 22.917 (14.729)	Prec@5 43.750 (25.001)
Epoch: [0][2610/206270]	Time 2.563 (2.567)	Data 0.012 (0.013)	Loss 5.1029 (6.3000)	Prec@1 27.083 (14.757)	Prec@5 37.500 (25.032)
Epoch: [0][2620/206270]	Time 2.545 (2.567)	Data 0.014 (0.013)	Loss 4.8891 (6.2960)	Prec@1 27.083 (14.785)	Prec@5 35.417 (25.069)
Epoch: [0][2630/206270]	Time 2.553 (2.567)	Data 0.012 (0.013)	Loss 5.1842 (6.2918)	Prec@1 27.083 (14.821)	Prec@5 37.500 (25.119)
Epoch: [0][2640/206270]	Time 2.580 (2.567)	Data 0.012 (0.013)	Loss 4.7413 (6.2877)	Prec@1 31.250 (14.852)	Prec@5 43.750 (25.165)
Epoch: [0][2650/206270]	Time 2.562 (2.567)	Data 0.013 (0.013)	Loss 5.1125 (6.2833)	Prec@1 25.000 

Epoch: [0][3220/206270]	Time 2.559 (2.566)	Data 0.012 (0.013)	Loss 5.2192 (6.0890)	Prec@1 18.750 (16.500)	Prec@5 35.417 (27.374)
Epoch: [0][3230/206270]	Time 2.573 (2.566)	Data 0.021 (0.013)	Loss 5.1063 (6.0867)	Prec@1 18.750 (16.508)	Prec@5 37.500 (27.399)
Epoch: [0][3240/206270]	Time 2.564 (2.566)	Data 0.014 (0.013)	Loss 4.5828 (6.0829)	Prec@1 33.333 (16.545)	Prec@5 41.667 (27.449)
Epoch: [0][3250/206270]	Time 2.556 (2.565)	Data 0.016 (0.013)	Loss 4.9020 (6.0800)	Prec@1 27.083 (16.574)	Prec@5 37.500 (27.486)
Epoch: [0][3260/206270]	Time 2.549 (2.565)	Data 0.012 (0.013)	Loss 5.1972 (6.0775)	Prec@1 22.917 (16.593)	Prec@5 39.583 (27.512)
Epoch: [0][3270/206270]	Time 2.557 (2.565)	Data 0.012 (0.013)	Loss 5.0947 (6.0745)	Prec@1 18.750 (16.614)	Prec@5 45.833 (27.545)
Epoch: [0][3280/206270]	Time 2.561 (2.565)	Data 0.016 (0.013)	Loss 5.7553 (6.0717)	Prec@1 16.667 (16.644)	Prec@5 27.083 (27.570)
Epoch: [0][3290/206270]	Time 2.566 (2.565)	Data 0.018 (0.013)	Loss 5.3014 (6.0681)	Prec@1 27.083 

Epoch: [0][3860/206270]	Time 2.566 (2.564)	Data 0.017 (0.014)	Loss 5.4715 (5.9135)	Prec@1 20.833 (17.942)	Prec@5 35.417 (29.348)
Epoch: [0][3870/206270]	Time 2.559 (2.564)	Data 0.014 (0.014)	Loss 4.7322 (5.9107)	Prec@1 37.500 (17.971)	Prec@5 43.750 (29.378)
Epoch: [0][3880/206270]	Time 2.576 (2.564)	Data 0.014 (0.014)	Loss 4.8589 (5.9081)	Prec@1 18.750 (17.995)	Prec@5 37.500 (29.408)
Epoch: [0][3890/206270]	Time 2.565 (2.564)	Data 0.020 (0.014)	Loss 4.9263 (5.9056)	Prec@1 31.250 (18.016)	Prec@5 43.750 (29.438)
Epoch: [0][3900/206270]	Time 2.568 (2.564)	Data 0.013 (0.014)	Loss 4.5508 (5.9034)	Prec@1 27.083 (18.034)	Prec@5 41.667 (29.457)
Epoch: [0][3910/206270]	Time 2.567 (2.564)	Data 0.014 (0.014)	Loss 4.5794 (5.9004)	Prec@1 35.417 (18.060)	Prec@5 50.000 (29.496)
Epoch: [0][3920/206270]	Time 2.546 (2.564)	Data 0.016 (0.014)	Loss 4.9191 (5.8982)	Prec@1 27.083 (18.083)	Prec@5 43.750 (29.517)
Epoch: [0][3930/206270]	Time 2.572 (2.564)	Data 0.013 (0.014)	Loss 4.6575 (5.8955)	Prec@1 27.083 

Epoch: [0][4500/206270]	Time 2.553 (2.564)	Data 0.014 (0.014)	Loss 5.1257 (5.7662)	Prec@1 25.000 (19.184)	Prec@5 39.583 (31.001)
Epoch: [0][4510/206270]	Time 2.568 (2.564)	Data 0.014 (0.014)	Loss 5.3826 (5.7641)	Prec@1 22.917 (19.201)	Prec@5 35.417 (31.025)
Epoch: [0][4520/206270]	Time 2.550 (2.564)	Data 0.015 (0.014)	Loss 5.0443 (5.7620)	Prec@1 27.083 (19.216)	Prec@5 41.667 (31.054)
Epoch: [0][4530/206270]	Time 2.562 (2.564)	Data 0.014 (0.014)	Loss 5.1698 (5.7598)	Prec@1 25.000 (19.236)	Prec@5 37.500 (31.080)
Epoch: [0][4540/206270]	Time 2.568 (2.564)	Data 0.036 (0.014)	Loss 4.8824 (5.7581)	Prec@1 22.917 (19.248)	Prec@5 41.667 (31.099)
Epoch: [0][4550/206270]	Time 2.557 (2.564)	Data 0.014 (0.014)	Loss 4.4005 (5.7556)	Prec@1 22.917 (19.266)	Prec@5 45.833 (31.126)
Epoch: [0][4560/206270]	Time 2.557 (2.564)	Data 0.018 (0.014)	Loss 4.4280 (5.7537)	Prec@1 29.167 (19.283)	Prec@5 47.917 (31.148)
Epoch: [0][4570/206270]	Time 2.563 (2.564)	Data 0.014 (0.014)	Loss 3.9962 (5.7510)	Prec@1 35.417 

Epoch: [0][5140/206270]	Time 2.579 (2.564)	Data 0.014 (0.015)	Loss 3.9031 (5.6365)	Prec@1 41.667 (20.315)	Prec@5 52.083 (32.476)
Epoch: [0][5150/206270]	Time 2.600 (2.564)	Data 0.022 (0.015)	Loss 4.7742 (5.6346)	Prec@1 27.083 (20.334)	Prec@5 45.833 (32.501)
Epoch: [0][5160/206270]	Time 2.580 (2.564)	Data 0.017 (0.015)	Loss 4.5564 (5.6328)	Prec@1 33.333 (20.350)	Prec@5 50.000 (32.521)
Epoch: [0][5170/206270]	Time 2.587 (2.564)	Data 0.015 (0.015)	Loss 5.1566 (5.6305)	Prec@1 18.750 (20.375)	Prec@5 37.500 (32.548)
Epoch: [0][5180/206270]	Time 2.568 (2.564)	Data 0.015 (0.015)	Loss 4.3458 (5.6286)	Prec@1 31.250 (20.392)	Prec@5 52.083 (32.571)
Epoch: [0][5190/206270]	Time 2.584 (2.564)	Data 0.017 (0.015)	Loss 4.8032 (5.6270)	Prec@1 27.083 (20.404)	Prec@5 35.417 (32.588)
Epoch: [0][5200/206270]	Time 2.570 (2.564)	Data 0.015 (0.015)	Loss 5.0871 (5.6260)	Prec@1 20.833 (20.411)	Prec@5 39.583 (32.596)
Epoch: [0][5210/206270]	Time 2.576 (2.564)	Data 0.017 (0.015)	Loss 4.8222 (5.6243)	Prec@1 20.833 

Epoch: [0][5780/206270]	Time 2.588 (2.566)	Data 0.023 (0.015)	Loss 4.5366 (5.5244)	Prec@1 27.083 (21.309)	Prec@5 37.500 (33.726)
Epoch: [0][5790/206270]	Time 2.574 (2.566)	Data 0.015 (0.015)	Loss 5.3098 (5.5230)	Prec@1 18.750 (21.319)	Prec@5 35.417 (33.738)
Epoch: [0][5800/206270]	Time 2.575 (2.566)	Data 0.016 (0.015)	Loss 4.1931 (5.5212)	Prec@1 37.500 (21.335)	Prec@5 45.833 (33.757)
Epoch: [0][5810/206270]	Time 2.583 (2.566)	Data 0.016 (0.015)	Loss 3.9917 (5.5195)	Prec@1 33.333 (21.348)	Prec@5 52.083 (33.777)
Epoch: [0][5820/206270]	Time 2.576 (2.566)	Data 0.016 (0.015)	Loss 4.7879 (5.5181)	Prec@1 29.167 (21.360)	Prec@5 39.583 (33.793)
Epoch: [0][5830/206270]	Time 2.574 (2.566)	Data 0.017 (0.015)	Loss 4.8501 (5.5167)	Prec@1 31.250 (21.371)	Prec@5 39.583 (33.807)
Epoch: [0][5840/206270]	Time 2.591 (2.566)	Data 0.016 (0.015)	Loss 4.0357 (5.5150)	Prec@1 31.250 (21.383)	Prec@5 52.083 (33.824)
Epoch: [0][5850/206270]	Time 2.572 (2.566)	Data 0.019 (0.015)	Loss 5.2198 (5.5131)	Prec@1 27.083 

Epoch: [0][6420/206270]	Time 2.563 (2.567)	Data 0.021 (0.016)	Loss 4.5238 (5.4234)	Prec@1 29.167 (22.187)	Prec@5 47.917 (34.844)
Epoch: [0][6430/206270]	Time 2.578 (2.567)	Data 0.022 (0.016)	Loss 3.6619 (5.4217)	Prec@1 39.583 (22.203)	Prec@5 56.250 (34.865)
Epoch: [0][6440/206270]	Time 2.569 (2.567)	Data 0.017 (0.016)	Loss 3.5278 (5.4202)	Prec@1 43.750 (22.216)	Prec@5 60.417 (34.881)
Epoch: [0][6450/206270]	Time 2.578 (2.567)	Data 0.017 (0.016)	Loss 3.8225 (5.4185)	Prec@1 35.417 (22.231)	Prec@5 52.083 (34.905)
Epoch: [0][6460/206270]	Time 2.576 (2.567)	Data 0.022 (0.016)	Loss 3.9276 (5.4168)	Prec@1 33.333 (22.248)	Prec@5 56.250 (34.927)
Epoch: [0][6470/206270]	Time 2.564 (2.567)	Data 0.017 (0.016)	Loss 5.1986 (5.4156)	Prec@1 22.917 (22.254)	Prec@5 35.417 (34.938)
Epoch: [0][6480/206270]	Time 2.558 (2.567)	Data 0.017 (0.016)	Loss 4.4361 (5.4142)	Prec@1 29.167 (22.268)	Prec@5 39.583 (34.952)
Epoch: [0][6490/206270]	Time 2.587 (2.567)	Data 0.017 (0.016)	Loss 4.0760 (5.4129)	Prec@1 37.500 

Epoch: [0][7060/206270]	Time 2.568 (2.568)	Data 0.018 (0.016)	Loss 4.7730 (5.3337)	Prec@1 27.083 (22.986)	Prec@5 41.667 (35.858)
Epoch: [0][7070/206270]	Time 2.578 (2.568)	Data 0.019 (0.016)	Loss 3.9050 (5.3321)	Prec@1 37.500 (23.000)	Prec@5 54.167 (35.877)
Epoch: [0][7080/206270]	Time 2.579 (2.568)	Data 0.033 (0.016)	Loss 4.7027 (5.3305)	Prec@1 27.083 (23.016)	Prec@5 35.417 (35.894)
Epoch: [0][7090/206270]	Time 2.569 (2.568)	Data 0.018 (0.016)	Loss 4.6723 (5.3293)	Prec@1 22.917 (23.024)	Prec@5 43.750 (35.907)
Epoch: [0][7100/206270]	Time 2.578 (2.568)	Data 0.018 (0.016)	Loss 5.0802 (5.3281)	Prec@1 25.000 (23.038)	Prec@5 37.500 (35.923)
Epoch: [0][7110/206270]	Time 2.573 (2.568)	Data 0.019 (0.016)	Loss 4.9293 (5.3268)	Prec@1 20.833 (23.047)	Prec@5 39.583 (35.936)
Epoch: [0][7120/206270]	Time 2.564 (2.568)	Data 0.019 (0.016)	Loss 4.1355 (5.3252)	Prec@1 39.583 (23.063)	Prec@5 50.000 (35.953)
Epoch: [0][7130/206270]	Time 2.594 (2.568)	Data 0.031 (0.016)	Loss 4.5809 (5.3238)	Prec@1 29.167 

Epoch: [0][7700/206270]	Time 2.568 (2.569)	Data 0.019 (0.017)	Loss 3.7120 (5.2488)	Prec@1 47.917 (23.771)	Prec@5 56.250 (36.856)
Epoch: [0][7710/206270]	Time 2.574 (2.569)	Data 0.019 (0.017)	Loss 3.7576 (5.2475)	Prec@1 39.583 (23.782)	Prec@5 54.167 (36.873)
Epoch: [0][7720/206270]	Time 2.582 (2.569)	Data 0.019 (0.017)	Loss 4.5266 (5.2463)	Prec@1 33.333 (23.796)	Prec@5 45.833 (36.890)
Epoch: [0][7730/206270]	Time 2.585 (2.569)	Data 0.024 (0.017)	Loss 4.4396 (5.2452)	Prec@1 31.250 (23.804)	Prec@5 47.917 (36.901)
Epoch: [0][7740/206270]	Time 2.592 (2.569)	Data 0.023 (0.017)	Loss 4.3240 (5.2442)	Prec@1 29.167 (23.813)	Prec@5 50.000 (36.914)
Epoch: [0][7750/206270]	Time 2.586 (2.569)	Data 0.022 (0.017)	Loss 4.2903 (5.2433)	Prec@1 37.500 (23.819)	Prec@5 50.000 (36.922)
Epoch: [0][7760/206270]	Time 2.588 (2.569)	Data 0.028 (0.017)	Loss 4.5193 (5.2422)	Prec@1 33.333 (23.830)	Prec@5 45.833 (36.935)
Epoch: [0][7770/206270]	Time 2.585 (2.569)	Data 0.022 (0.017)	Loss 4.3504 (5.2409)	Prec@1 31.250 

Epoch: [0][8340/206270]	Time 2.606 (2.570)	Data 0.044 (0.017)	Loss 4.2783 (5.1747)	Prec@1 31.250 (24.448)	Prec@5 50.000 (37.718)
Epoch: [0][8350/206270]	Time 2.593 (2.570)	Data 0.027 (0.017)	Loss 4.7734 (5.1735)	Prec@1 31.250 (24.457)	Prec@5 41.667 (37.732)
Epoch: [0][8360/206270]	Time 2.571 (2.570)	Data 0.020 (0.017)	Loss 4.9037 (5.1724)	Prec@1 22.917 (24.469)	Prec@5 45.833 (37.745)
Epoch: [0][8370/206270]	Time 2.582 (2.570)	Data 0.025 (0.017)	Loss 3.6536 (5.1712)	Prec@1 43.750 (24.479)	Prec@5 56.250 (37.760)
Epoch: [0][8380/206270]	Time 2.597 (2.570)	Data 0.025 (0.017)	Loss 4.4045 (5.1700)	Prec@1 35.417 (24.494)	Prec@5 45.833 (37.776)
Epoch: [0][8390/206270]	Time 2.581 (2.570)	Data 0.020 (0.017)	Loss 4.2308 (5.1687)	Prec@1 33.333 (24.507)	Prec@5 54.167 (37.790)
Epoch: [0][8400/206270]	Time 2.584 (2.570)	Data 0.021 (0.017)	Loss 3.9189 (5.1673)	Prec@1 33.333 (24.521)	Prec@5 52.083 (37.808)
Epoch: [0][8410/206270]	Time 2.585 (2.570)	Data 0.020 (0.017)	Loss 4.2289 (5.1663)	Prec@1 27.083 

Epoch: [0][8980/206270]	Time 2.575 (2.570)	Data 0.022 (0.018)	Loss 3.7860 (5.1042)	Prec@1 37.500 (25.114)	Prec@5 58.333 (38.541)
Epoch: [0][8990/206270]	Time 2.569 (2.570)	Data 0.033 (0.018)	Loss 4.4785 (5.1033)	Prec@1 29.167 (25.120)	Prec@5 43.750 (38.552)
Epoch: [0][9000/206270]	Time 2.563 (2.570)	Data 0.024 (0.018)	Loss 4.5792 (5.1023)	Prec@1 29.167 (25.128)	Prec@5 43.750 (38.562)
Epoch: [0][9010/206270]	Time 2.581 (2.570)	Data 0.025 (0.018)	Loss 3.9219 (5.1012)	Prec@1 43.750 (25.139)	Prec@5 56.250 (38.576)
Epoch: [0][9020/206270]	Time 2.586 (2.570)	Data 0.022 (0.018)	Loss 3.5137 (5.1003)	Prec@1 47.917 (25.148)	Prec@5 54.167 (38.586)
Epoch: [0][9030/206270]	Time 2.578 (2.570)	Data 0.022 (0.018)	Loss 4.2965 (5.0993)	Prec@1 29.167 (25.154)	Prec@5 45.833 (38.597)
Epoch: [0][9040/206270]	Time 2.593 (2.570)	Data 0.021 (0.018)	Loss 4.0844 (5.0981)	Prec@1 35.417 (25.168)	Prec@5 52.083 (38.613)
Epoch: [0][9050/206270]	Time 2.593 (2.570)	Data 0.022 (0.018)	Loss 3.5264 (5.0969)	Prec@1 45.833 

Epoch: [0][9620/206270]	Time 2.583 (2.571)	Data 0.025 (0.018)	Loss 3.5054 (5.0393)	Prec@1 37.500 (25.710)	Prec@5 60.417 (39.301)
Epoch: [0][9630/206270]	Time 2.568 (2.571)	Data 0.022 (0.018)	Loss 4.8630 (5.0383)	Prec@1 18.750 (25.718)	Prec@5 43.750 (39.311)
Epoch: [0][9640/206270]	Time 2.588 (2.571)	Data 0.031 (0.018)	Loss 2.9683 (5.0372)	Prec@1 52.083 (25.728)	Prec@5 70.833 (39.325)
Epoch: [0][9650/206270]	Time 2.582 (2.571)	Data 0.031 (0.018)	Loss 5.0955 (5.0364)	Prec@1 16.667 (25.735)	Prec@5 39.583 (39.336)
Epoch: [0][9660/206270]	Time 2.570 (2.571)	Data 0.024 (0.018)	Loss 3.8341 (5.0352)	Prec@1 43.750 (25.745)	Prec@5 54.167 (39.349)
Epoch: [0][9670/206270]	Time 2.588 (2.571)	Data 0.031 (0.018)	Loss 4.6852 (5.0344)	Prec@1 31.250 (25.753)	Prec@5 37.500 (39.357)
Epoch: [0][9680/206270]	Time 2.608 (2.571)	Data 0.023 (0.018)	Loss 4.2166 (5.0333)	Prec@1 31.250 (25.762)	Prec@5 45.833 (39.370)
Epoch: [0][9690/206270]	Time 2.606 (2.571)	Data 0.032 (0.018)	Loss 4.3907 (5.0326)	Prec@1 27.083 

Epoch: [0][10260/206270]	Time 2.568 (2.574)	Data 0.023 (0.021)	Loss 4.2704 (4.9782)	Prec@1 43.750 (26.289)	Prec@5 47.917 (40.028)
Epoch: [0][10270/206270]	Time 2.602 (2.574)	Data 0.027 (0.021)	Loss 3.8151 (4.9771)	Prec@1 35.417 (26.299)	Prec@5 54.167 (40.039)
Epoch: [0][10280/206270]	Time 2.609 (2.574)	Data 0.030 (0.021)	Loss 4.0418 (4.9761)	Prec@1 37.500 (26.310)	Prec@5 50.000 (40.052)
Epoch: [0][10290/206270]	Time 2.577 (2.574)	Data 0.023 (0.021)	Loss 3.5911 (4.9751)	Prec@1 47.917 (26.318)	Prec@5 58.333 (40.064)
Epoch: [0][10300/206270]	Time 2.570 (2.574)	Data 0.023 (0.021)	Loss 4.1317 (4.9741)	Prec@1 35.417 (26.328)	Prec@5 52.083 (40.077)
