In [1]:
import dgl
import time
import torch as th
import numpy as np
import torch.nn.functional as F

from load_data import load_ogb
from model import SAGE, GAT, get_eigen
from train_eval import train_sample

Using backend: pytorch


This notebook shows the performance of GraphSAGE on the ogbn-products graph when scaled eigenvectors are used as positional embeddings for the nodes. These positional node embeddings are fixed in this model.

In [4]:
# Experiment: train GraphSAGE on ogbn-products using eigenvectors scaled by the
# square root of their eigenvalues as the (fixed) node input features.
g, num_labels = load_ogb('ogbn-products')
# Remove the node features stored on the graph; only the eigenvector-based
# features built below are handed to the model.
g.ndata.pop('features')

# Number of eigenpairs requested from get_eigen.
in_feats = 128
eigen_vals, eigen_vecs = get_eigen(g, in_feats, 'ogbn-products')
# The same graph object is used for training, validation and testing.
train_g = val_g = test_g = g

# np.sqrt returns NaN for negative inputs, which would silently poison every
# node feature. Fail loudly instead of training on NaNs.
assert np.all(np.asarray(eigen_vals) >= 0), \
    'negative eigenvalue found: sqrt scaling would produce NaN node features'
# Reshape the per-eigenvalue scale to a (1, k) row so that it broadcasts over
# the last axis of eigen_vecs.
eigen_scale = np.sqrt(eigen_vals).reshape((1, len(eigen_vals)))
train_nfeat = val_nfeat = test_nfeat = th.tensor(eigen_vecs * eigen_scale,
                                                 dtype=th.float32)
train_labels = val_labels = test_labels = g.ndata.pop('labels')

hyperparams = {
    'batch_size': 1024,
    'num_workers': 4,
    'num_hidden': 256,
    'num_layers': 3,
    'dropout': 0.5,
    'lr': 0.003,
    'num_epochs': 50,
    'fanouts': [15,10,5],
    'eval_batch_size': 10000
}

# Prefer the second GPU (the device used for the recorded run), but fall back
# to the first GPU or the CPU so the cell still runs on smaller machines.
# NOTE(review): CPU execution depends on train_sample supporting it — confirm.
if th.cuda.device_count() > 1:
    device = th.device('cuda:1')
elif th.cuda.is_available():
    device = th.device('cuda:0')
else:
    device = th.device('cpu')

# Pack data
data = train_g, val_g, test_g, train_nfeat, train_labels, \
           val_nfeat, val_labels, test_nfeat, test_labels
# Define model
# The model input size is taken from the feature matrix actually built above.
in_feats = train_nfeat.shape[1]
model = SAGE(in_feats, hyperparams['num_hidden'], num_labels,
             hyperparams['num_layers'], F.relu, hyperparams['dropout'])
# NOTE(review): the trailing 3 is presumably the evaluation interval in
# epochs — confirm against train_eval.train_sample.
train_sample(model, data, hyperparams, device, 3)

load ogbn-products
finish loading ogbn-products
finish constructing ogbn-products
Epoch 00000 | Step 00000 | Loss 3.8544 | Train Acc 0.0176 | Speed (samples/sec) nan | GPU 780.6 MB
Epoch 00000 | Step 00020 | Loss 1.9016 | Train Acc 0.5156 | Speed (samples/sec) 6019.9496 | GPU 788.2 MB
Epoch 00000 | Step 00040 | Loss 1.2882 | Train Acc 0.6602 | Speed (samples/sec) 5974.9644 | GPU 789.3 MB
Epoch 00000 | Step 00060 | Loss 1.1621 | Train Acc 0.6973 | Speed (samples/sec) 5980.1294 | GPU 790.0 MB
Epoch 00000 | Step 00080 | Loss 1.0794 | Train Acc 0.7061 | Speed (samples/sec) 5997.3360 | GPU 790.0 MB
Epoch 00000 | Step 00100 | Loss 0.9954 | Train Acc 0.7412 | Speed (samples/sec) 5979.2930 | GPU 790.0 MB
Epoch 00000 | Step 00120 | Loss 0.9324 | Train Acc 0.7305 | Speed (samples/sec) 6042.2025 | GPU 790.0 MB
Epoch 00000 | Step 00140 | Loss 0.8243 | Train Acc 0.7783 | Speed (samples/sec) 6063.7062 | GPU 790.6 MB
Epoch 00000 | Step 00160 | Loss 0.8547 | Train Acc 0.7705 | Speed (samples/sec) 6107

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 35.8194


100%|██████████| 245/245 [00:38<00:00,  6.36it/s]
100%|██████████| 245/245 [00:50<00:00,  4.88it/s]
100%|██████████| 245/245 [00:46<00:00,  5.31it/s]


Val acc 0.8298, Test Acc: 0.6761
Best val acc 0.8298, best test acc: 0.6761
Epoch 00004 | Step 00000 | Loss 0.5744 | Train Acc 0.8408 | Speed (samples/sec) 6107.6874 | GPU 791.4 MB
Epoch 00004 | Step 00020 | Loss 0.6007 | Train Acc 0.8359 | Speed (samples/sec) 6113.7388 | GPU 791.4 MB
Epoch 00004 | Step 00040 | Loss 0.6034 | Train Acc 0.8301 | Speed (samples/sec) 6116.8245 | GPU 791.4 MB
Epoch 00004 | Step 00060 | Loss 0.5607 | Train Acc 0.8398 | Speed (samples/sec) 6120.2550 | GPU 791.4 MB
Epoch 00004 | Step 00080 | Loss 0.5402 | Train Acc 0.8418 | Speed (samples/sec) 6121.5181 | GPU 791.4 MB
Epoch 00004 | Step 00100 | Loss 0.5812 | Train Acc 0.8564 | Speed (samples/sec) 6117.7308 | GPU 791.4 MB
Epoch 00004 | Step 00120 | Loss 0.5674 | Train Acc 0.8477 | Speed (samples/sec) 6122.2888 | GPU 791.4 MB
Epoch 00004 | Step 00140 | Loss 0.5463 | Train Acc 0.8398 | Speed (samples/sec) 6125.5965 | GPU 791.4 MB
Epoch 00004 | Step 00160 | Loss 0.5821 | Train Acc 0.8350 | Speed (samples/sec) 6131

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.4076


100%|██████████| 245/245 [00:39<00:00,  6.18it/s]
100%|██████████| 245/245 [00:48<00:00,  5.02it/s]
100%|██████████| 245/245 [00:47<00:00,  5.14it/s]


Val acc 0.7764, Test Acc: 0.6117
Epoch 00007 | Step 00000 | Loss 0.7289 | Train Acc 0.7988 | Speed (samples/sec) 6121.4543 | GPU 791.8 MB
Epoch 00007 | Step 00020 | Loss 0.5493 | Train Acc 0.8447 | Speed (samples/sec) 6126.2350 | GPU 791.8 MB
Epoch 00007 | Step 00040 | Loss 0.5425 | Train Acc 0.8438 | Speed (samples/sec) 6130.9755 | GPU 791.8 MB
Epoch 00007 | Step 00060 | Loss 0.5311 | Train Acc 0.8516 | Speed (samples/sec) 6131.9336 | GPU 791.8 MB
Epoch 00007 | Step 00080 | Loss 0.6043 | Train Acc 0.8242 | Speed (samples/sec) 6132.7007 | GPU 791.8 MB
Epoch 00007 | Step 00100 | Loss 0.4780 | Train Acc 0.8555 | Speed (samples/sec) 6138.1277 | GPU 791.8 MB
Epoch 00007 | Step 00120 | Loss 0.5044 | Train Acc 0.8535 | Speed (samples/sec) 6143.2546 | GPU 791.8 MB
Epoch 00007 | Step 00140 | Loss 0.4776 | Train Acc 0.8623 | Speed (samples/sec) 6146.5125 | GPU 791.8 MB
Epoch 00007 | Step 00160 | Loss 0.4892 | Train Acc 0.8633 | Speed (samples/sec) 6149.7394 | GPU 791.8 MB
Epoch 00007 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.5858


100%|██████████| 245/245 [00:38<00:00,  6.31it/s]
100%|██████████| 245/245 [00:47<00:00,  5.17it/s]
100%|██████████| 245/245 [00:48<00:00,  5.04it/s]


Val acc 0.8594, Test Acc: 0.7056
Best val acc 0.8594, best test acc: 0.7056
Epoch 00010 | Step 00000 | Loss 0.5822 | Train Acc 0.8369 | Speed (samples/sec) 6148.4466 | GPU 791.8 MB
Epoch 00010 | Step 00020 | Loss 0.5442 | Train Acc 0.8408 | Speed (samples/sec) 6149.0747 | GPU 791.8 MB
Epoch 00010 | Step 00040 | Loss 0.5436 | Train Acc 0.8477 | Speed (samples/sec) 6149.5069 | GPU 791.8 MB
Epoch 00010 | Step 00060 | Loss 0.4992 | Train Acc 0.8574 | Speed (samples/sec) 6150.0209 | GPU 791.8 MB
Epoch 00010 | Step 00080 | Loss 0.5596 | Train Acc 0.8330 | Speed (samples/sec) 6150.4253 | GPU 791.8 MB
Epoch 00010 | Step 00100 | Loss 0.5257 | Train Acc 0.8564 | Speed (samples/sec) 6150.8144 | GPU 791.8 MB
Epoch 00010 | Step 00120 | Loss 0.5315 | Train Acc 0.8477 | Speed (samples/sec) 6151.5088 | GPU 791.8 MB
Epoch 00010 | Step 00140 | Loss 0.5407 | Train Acc 0.8486 | Speed (samples/sec) 6153.1639 | GPU 791.8 MB
Epoch 00010 | Step 00160 | Loss 0.5158 | Train Acc 0.8564 | Speed (samples/sec) 6153

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 35.5599


100%|██████████| 245/245 [00:39<00:00,  6.23it/s]
100%|██████████| 245/245 [00:49<00:00,  4.95it/s]
100%|██████████| 245/245 [00:48<00:00,  5.03it/s]


Val acc 0.7914, Test Acc: 0.6285
Epoch 00013 | Step 00000 | Loss 0.7152 | Train Acc 0.8027 | Speed (samples/sec) 6145.7797 | GPU 791.8 MB
Epoch 00013 | Step 00020 | Loss 0.4954 | Train Acc 0.8574 | Speed (samples/sec) 6145.4460 | GPU 791.8 MB
Epoch 00013 | Step 00040 | Loss 0.5039 | Train Acc 0.8564 | Speed (samples/sec) 6144.7758 | GPU 791.8 MB
Epoch 00013 | Step 00060 | Loss 0.4361 | Train Acc 0.8643 | Speed (samples/sec) 6145.1595 | GPU 791.8 MB
Epoch 00013 | Step 00080 | Loss 0.4801 | Train Acc 0.8662 | Speed (samples/sec) 6146.2020 | GPU 791.8 MB
Epoch 00013 | Step 00100 | Loss 0.4733 | Train Acc 0.8662 | Speed (samples/sec) 6147.2955 | GPU 791.8 MB
Epoch 00013 | Step 00120 | Loss 0.4503 | Train Acc 0.8604 | Speed (samples/sec) 6148.9212 | GPU 791.8 MB
Epoch 00013 | Step 00140 | Loss 0.4936 | Train Acc 0.8604 | Speed (samples/sec) 6147.3651 | GPU 791.8 MB
Epoch 00013 | Step 00160 | Loss 0.4691 | Train Acc 0.8564 | Speed (samples/sec) 6148.3299 | GPU 791.8 MB
Epoch 00013 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 34.8824


100%|██████████| 245/245 [00:38<00:00,  6.40it/s]
100%|██████████| 245/245 [00:48<00:00,  5.01it/s]
100%|██████████| 245/245 [00:48<00:00,  5.03it/s]


Val acc 0.8752, Test Acc: 0.7439
Best val acc 0.8752, best test acc: 0.7439
Epoch 00016 | Step 00000 | Loss 0.4461 | Train Acc 0.8730 | Speed (samples/sec) 6155.6904 | GPU 791.8 MB
Epoch 00016 | Step 00020 | Loss 0.4201 | Train Acc 0.8916 | Speed (samples/sec) 6154.8901 | GPU 791.8 MB
Epoch 00016 | Step 00040 | Loss 0.4060 | Train Acc 0.8867 | Speed (samples/sec) 6153.1934 | GPU 791.8 MB
Epoch 00016 | Step 00060 | Loss 0.4487 | Train Acc 0.8701 | Speed (samples/sec) 6153.4593 | GPU 791.8 MB
Epoch 00016 | Step 00080 | Loss 0.4492 | Train Acc 0.8633 | Speed (samples/sec) 6154.1611 | GPU 791.8 MB
Epoch 00016 | Step 00100 | Loss 0.4696 | Train Acc 0.8613 | Speed (samples/sec) 6153.1460 | GPU 791.8 MB
Epoch 00016 | Step 00120 | Loss 0.4631 | Train Acc 0.8486 | Speed (samples/sec) 6151.8756 | GPU 791.8 MB
Epoch 00016 | Step 00140 | Loss 0.4084 | Train Acc 0.8799 | Speed (samples/sec) 6152.3095 | GPU 791.8 MB
Epoch 00016 | Step 00160 | Loss 0.4665 | Train Acc 0.8623 | Speed (samples/sec) 6152

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.1903


100%|██████████| 245/245 [00:38<00:00,  6.34it/s]
100%|██████████| 245/245 [00:52<00:00,  4.70it/s]
100%|██████████| 245/245 [00:52<00:00,  4.66it/s]


Val acc 0.8741, Test Acc: 0.7163
Epoch 00019 | Step 00000 | Loss 0.3862 | Train Acc 0.8828 | Speed (samples/sec) 6137.5992 | GPU 791.8 MB
Epoch 00019 | Step 00020 | Loss 0.4564 | Train Acc 0.8691 | Speed (samples/sec) 6133.6706 | GPU 791.8 MB
Epoch 00019 | Step 00040 | Loss 0.5154 | Train Acc 0.8613 | Speed (samples/sec) 6132.9414 | GPU 791.8 MB
Epoch 00019 | Step 00060 | Loss 0.4601 | Train Acc 0.8701 | Speed (samples/sec) 6131.6125 | GPU 791.8 MB
Epoch 00019 | Step 00080 | Loss 0.4061 | Train Acc 0.8906 | Speed (samples/sec) 6129.7509 | GPU 791.8 MB
Epoch 00019 | Step 00100 | Loss 0.4178 | Train Acc 0.8691 | Speed (samples/sec) 6127.4091 | GPU 791.8 MB
Epoch 00019 | Step 00120 | Loss 0.4388 | Train Acc 0.8848 | Speed (samples/sec) 6125.6230 | GPU 791.8 MB
Epoch 00019 | Step 00140 | Loss 0.4589 | Train Acc 0.8809 | Speed (samples/sec) 6123.6024 | GPU 791.8 MB
Epoch 00019 | Step 00160 | Loss 0.4922 | Train Acc 0.8633 | Speed (samples/sec) 6120.7244 | GPU 791.8 MB
Epoch 00019 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 39.1095


100%|██████████| 245/245 [00:42<00:00,  5.75it/s]
100%|██████████| 245/245 [00:53<00:00,  4.59it/s]
100%|██████████| 245/245 [00:53<00:00,  4.56it/s]


Val acc 0.8773, Test Acc: 0.7180
Best val acc 0.8773, best test acc: 0.7180
Epoch 00022 | Step 00000 | Loss 0.4637 | Train Acc 0.8721 | Speed (samples/sec) 6073.2675 | GPU 791.8 MB
Epoch 00022 | Step 00020 | Loss 0.4183 | Train Acc 0.8906 | Speed (samples/sec) 6070.6106 | GPU 791.8 MB
Epoch 00022 | Step 00040 | Loss 0.4503 | Train Acc 0.8730 | Speed (samples/sec) 6070.1145 | GPU 791.8 MB
Epoch 00022 | Step 00060 | Loss 0.4669 | Train Acc 0.8770 | Speed (samples/sec) 6069.0622 | GPU 791.8 MB
Epoch 00022 | Step 00080 | Loss 0.4466 | Train Acc 0.8691 | Speed (samples/sec) 6066.9555 | GPU 791.8 MB
Epoch 00022 | Step 00100 | Loss 0.5028 | Train Acc 0.8555 | Speed (samples/sec) 6066.3180 | GPU 791.8 MB
Epoch 00022 | Step 00120 | Loss 0.4907 | Train Acc 0.8535 | Speed (samples/sec) 6065.0176 | GPU 791.8 MB
Epoch 00022 | Step 00140 | Loss 0.4761 | Train Acc 0.8691 | Speed (samples/sec) 6063.7724 | GPU 791.8 MB
Epoch 00022 | Step 00160 | Loss 0.4106 | Train Acc 0.8838 | Speed (samples/sec) 6061

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 40.3105


100%|██████████| 245/245 [00:43<00:00,  5.62it/s]
100%|██████████| 245/245 [00:52<00:00,  4.68it/s]
100%|██████████| 245/245 [00:50<00:00,  4.85it/s]


Val acc 0.8809, Test Acc: 0.7252
Best val acc 0.8809, best test acc: 0.7252
Epoch 00025 | Step 00000 | Loss 0.3849 | Train Acc 0.8867 | Speed (samples/sec) 6012.8511 | GPU 792.3 MB
Epoch 00025 | Step 00020 | Loss 0.4681 | Train Acc 0.8623 | Speed (samples/sec) 6010.4121 | GPU 792.3 MB
Epoch 00025 | Step 00040 | Loss 0.4191 | Train Acc 0.8721 | Speed (samples/sec) 6009.2713 | GPU 792.3 MB
Epoch 00025 | Step 00060 | Loss 0.3854 | Train Acc 0.8887 | Speed (samples/sec) 6008.1685 | GPU 792.3 MB
Epoch 00025 | Step 00080 | Loss 0.4004 | Train Acc 0.9004 | Speed (samples/sec) 6007.0615 | GPU 792.3 MB
Epoch 00025 | Step 00100 | Loss 0.4645 | Train Acc 0.8721 | Speed (samples/sec) 6006.3592 | GPU 792.3 MB
Epoch 00025 | Step 00120 | Loss 0.4344 | Train Acc 0.8750 | Speed (samples/sec) 6006.3770 | GPU 792.3 MB
Epoch 00025 | Step 00140 | Loss 0.4009 | Train Acc 0.8789 | Speed (samples/sec) 6005.8891 | GPU 792.3 MB
Epoch 00025 | Step 00160 | Loss 0.5018 | Train Acc 0.8643 | Speed (samples/sec) 6005

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 38.4514


100%|██████████| 245/245 [00:43<00:00,  5.58it/s]
100%|██████████| 245/245 [00:55<00:00,  4.42it/s]
100%|██████████| 245/245 [00:55<00:00,  4.41it/s]


Val acc 0.8739, Test Acc: 0.7090
Epoch 00028 | Step 00000 | Loss 0.4328 | Train Acc 0.8730 | Speed (samples/sec) 5983.1011 | GPU 792.3 MB
Epoch 00028 | Step 00020 | Loss 0.4862 | Train Acc 0.8672 | Speed (samples/sec) 5982.4179 | GPU 792.3 MB
Epoch 00028 | Step 00040 | Loss 0.4186 | Train Acc 0.8838 | Speed (samples/sec) 5980.7022 | GPU 792.3 MB
Epoch 00028 | Step 00060 | Loss 0.3829 | Train Acc 0.8760 | Speed (samples/sec) 5978.6426 | GPU 792.3 MB
Epoch 00028 | Step 00080 | Loss 0.4207 | Train Acc 0.8848 | Speed (samples/sec) 5977.4320 | GPU 792.3 MB
Epoch 00028 | Step 00100 | Loss 0.4200 | Train Acc 0.8809 | Speed (samples/sec) 5976.2690 | GPU 792.3 MB
Epoch 00028 | Step 00120 | Loss 0.4467 | Train Acc 0.8799 | Speed (samples/sec) 5975.3417 | GPU 792.3 MB
Epoch 00028 | Step 00140 | Loss 0.3276 | Train Acc 0.9082 | Speed (samples/sec) 5974.6011 | GPU 792.3 MB
Epoch 00028 | Step 00160 | Loss 0.4136 | Train Acc 0.8779 | Speed (samples/sec) 5973.5651 | GPU 792.3 MB
Epoch 00028 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 38.0709


100%|██████████| 245/245 [00:42<00:00,  5.75it/s]
100%|██████████| 245/245 [00:54<00:00,  4.50it/s]
100%|██████████| 245/245 [00:50<00:00,  4.81it/s]


Val acc 0.8773, Test Acc: 0.7175
Epoch 00031 | Step 00000 | Loss 0.3961 | Train Acc 0.8828 | Speed (samples/sec) 5955.1060 | GPU 792.3 MB
Epoch 00031 | Step 00020 | Loss 0.3705 | Train Acc 0.8945 | Speed (samples/sec) 5954.2725 | GPU 792.3 MB
Epoch 00031 | Step 00040 | Loss 0.3941 | Train Acc 0.8760 | Speed (samples/sec) 5953.7363 | GPU 792.3 MB
Epoch 00031 | Step 00060 | Loss 0.3927 | Train Acc 0.9004 | Speed (samples/sec) 5953.1380 | GPU 792.3 MB
Epoch 00031 | Step 00080 | Loss 0.4155 | Train Acc 0.8740 | Speed (samples/sec) 5952.5978 | GPU 792.3 MB
Epoch 00031 | Step 00100 | Loss 0.4178 | Train Acc 0.8828 | Speed (samples/sec) 5952.4549 | GPU 792.3 MB
Epoch 00031 | Step 00120 | Loss 0.4006 | Train Acc 0.8838 | Speed (samples/sec) 5951.0390 | GPU 792.3 MB
Epoch 00031 | Step 00140 | Loss 0.4589 | Train Acc 0.8613 | Speed (samples/sec) 5950.0411 | GPU 792.3 MB
Epoch 00031 | Step 00160 | Loss 0.4895 | Train Acc 0.8633 | Speed (samples/sec) 5949.8745 | GPU 792.3 MB
Epoch 00031 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.0802


100%|██████████| 245/245 [00:39<00:00,  6.25it/s]
100%|██████████| 245/245 [00:49<00:00,  4.99it/s]
100%|██████████| 245/245 [00:49<00:00,  4.93it/s]


Val acc 0.8357, Test Acc: 0.6852
Epoch 00034 | Step 00000 | Loss 0.5607 | Train Acc 0.8408 | Speed (samples/sec) 5937.9568 | GPU 792.3 MB
Epoch 00034 | Step 00020 | Loss 0.4663 | Train Acc 0.8682 | Speed (samples/sec) 5938.0981 | GPU 792.3 MB
Epoch 00034 | Step 00040 | Loss 0.4115 | Train Acc 0.8828 | Speed (samples/sec) 5938.0037 | GPU 792.3 MB
Epoch 00034 | Step 00060 | Loss 0.4033 | Train Acc 0.8838 | Speed (samples/sec) 5938.3521 | GPU 792.3 MB
Epoch 00034 | Step 00080 | Loss 0.3906 | Train Acc 0.8828 | Speed (samples/sec) 5938.2788 | GPU 792.3 MB
Epoch 00034 | Step 00100 | Loss 0.4143 | Train Acc 0.8809 | Speed (samples/sec) 5938.0419 | GPU 792.3 MB
Epoch 00034 | Step 00120 | Loss 0.4320 | Train Acc 0.8750 | Speed (samples/sec) 5937.1887 | GPU 792.3 MB
Epoch 00034 | Step 00140 | Loss 0.4616 | Train Acc 0.8564 | Speed (samples/sec) 5937.6832 | GPU 792.3 MB
Epoch 00034 | Step 00160 | Loss 0.4324 | Train Acc 0.8682 | Speed (samples/sec) 5937.8791 | GPU 792.3 MB
Epoch 00034 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.9210


100%|██████████| 245/245 [00:41<00:00,  5.95it/s]
100%|██████████| 245/245 [00:49<00:00,  4.93it/s]
100%|██████████| 245/245 [00:51<00:00,  4.76it/s]


Val acc 0.8824, Test Acc: 0.7508
Best val acc 0.8824, best test acc: 0.7508
Epoch 00037 | Step 00000 | Loss 0.4295 | Train Acc 0.8848 | Speed (samples/sec) 5934.8470 | GPU 792.3 MB
Epoch 00037 | Step 00020 | Loss 0.3696 | Train Acc 0.8906 | Speed (samples/sec) 5934.3321 | GPU 792.3 MB
Epoch 00037 | Step 00040 | Loss 0.4447 | Train Acc 0.8877 | Speed (samples/sec) 5934.9164 | GPU 792.3 MB
Epoch 00037 | Step 00060 | Loss 0.4573 | Train Acc 0.8750 | Speed (samples/sec) 5934.4157 | GPU 792.3 MB
Epoch 00037 | Step 00080 | Loss 0.4351 | Train Acc 0.8760 | Speed (samples/sec) 5935.3200 | GPU 792.3 MB
Epoch 00037 | Step 00100 | Loss 0.3766 | Train Acc 0.8984 | Speed (samples/sec) 5935.7015 | GPU 792.3 MB
Epoch 00037 | Step 00120 | Loss 0.4377 | Train Acc 0.8770 | Speed (samples/sec) 5935.9417 | GPU 792.3 MB
Epoch 00037 | Step 00140 | Loss 0.4047 | Train Acc 0.8789 | Speed (samples/sec) 5935.9255 | GPU 792.3 MB
Epoch 00037 | Step 00160 | Loss 0.3741 | Train Acc 0.8945 | Speed (samples/sec) 5936

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 38.3240


100%|██████████| 245/245 [00:41<00:00,  5.90it/s]
100%|██████████| 245/245 [00:53<00:00,  4.62it/s]
100%|██████████| 245/245 [00:50<00:00,  4.83it/s]


Val acc 0.8635, Test Acc: 0.7160
Epoch 00040 | Step 00000 | Loss 0.4438 | Train Acc 0.8721 | Speed (samples/sec) 5931.1993 | GPU 792.3 MB
Epoch 00040 | Step 00020 | Loss 0.4558 | Train Acc 0.8555 | Speed (samples/sec) 5931.5191 | GPU 792.3 MB
Epoch 00040 | Step 00040 | Loss 0.3326 | Train Acc 0.9004 | Speed (samples/sec) 5931.2591 | GPU 792.3 MB
Epoch 00040 | Step 00060 | Loss 0.4425 | Train Acc 0.8770 | Speed (samples/sec) 5930.6048 | GPU 792.3 MB
Epoch 00040 | Step 00080 | Loss 0.3740 | Train Acc 0.8926 | Speed (samples/sec) 5930.7380 | GPU 792.3 MB
Epoch 00040 | Step 00100 | Loss 0.4401 | Train Acc 0.8652 | Speed (samples/sec) 5930.3695 | GPU 792.3 MB
Epoch 00040 | Step 00120 | Loss 0.3803 | Train Acc 0.8955 | Speed (samples/sec) 5930.8324 | GPU 792.3 MB
Epoch 00040 | Step 00140 | Loss 0.4279 | Train Acc 0.8848 | Speed (samples/sec) 5930.4701 | GPU 792.3 MB
Epoch 00040 | Step 00160 | Loss 0.3567 | Train Acc 0.8955 | Speed (samples/sec) 5930.3318 | GPU 792.3 MB
Epoch 00040 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.9172


100%|██████████| 245/245 [00:39<00:00,  6.18it/s]
100%|██████████| 245/245 [00:51<00:00,  4.74it/s]
100%|██████████| 245/245 [00:49<00:00,  4.93it/s]


Val acc 0.8858, Test Acc: 0.7279
Best val acc 0.8858, best test acc: 0.7279
Epoch 00043 | Step 00000 | Loss 0.3827 | Train Acc 0.8926 | Speed (samples/sec) 5929.9041 | GPU 792.3 MB
Epoch 00043 | Step 00020 | Loss 0.4326 | Train Acc 0.8740 | Speed (samples/sec) 5930.0099 | GPU 792.3 MB
Epoch 00043 | Step 00040 | Loss 0.4315 | Train Acc 0.8682 | Speed (samples/sec) 5930.6868 | GPU 792.3 MB
Epoch 00043 | Step 00060 | Loss 0.4274 | Train Acc 0.8730 | Speed (samples/sec) 5931.0474 | GPU 792.3 MB
Epoch 00043 | Step 00080 | Loss 0.4020 | Train Acc 0.8936 | Speed (samples/sec) 5931.7264 | GPU 792.3 MB
Epoch 00043 | Step 00100 | Loss 0.4550 | Train Acc 0.8818 | Speed (samples/sec) 5931.4391 | GPU 792.3 MB
Epoch 00043 | Step 00120 | Loss 0.4108 | Train Acc 0.8779 | Speed (samples/sec) 5931.8824 | GPU 792.3 MB
Epoch 00043 | Step 00140 | Loss 0.3896 | Train Acc 0.8809 | Speed (samples/sec) 5932.1424 | GPU 792.3 MB
Epoch 00043 | Step 00160 | Loss 0.4448 | Train Acc 0.8779 | Speed (samples/sec) 5932

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.2868


100%|██████████| 245/245 [00:40<00:00,  6.12it/s]
100%|██████████| 245/245 [00:51<00:00,  4.80it/s]
100%|██████████| 245/245 [00:49<00:00,  4.99it/s]


Val acc 0.8847, Test Acc: 0.7111
Epoch 00046 | Step 00000 | Loss 0.4711 | Train Acc 0.8691 | Speed (samples/sec) 5935.0547 | GPU 792.3 MB
Epoch 00046 | Step 00020 | Loss 0.4282 | Train Acc 0.8828 | Speed (samples/sec) 5936.2986 | GPU 792.3 MB
Epoch 00046 | Step 00040 | Loss 0.3499 | Train Acc 0.9004 | Speed (samples/sec) 5937.4623 | GPU 792.3 MB
Epoch 00046 | Step 00060 | Loss 0.4556 | Train Acc 0.8760 | Speed (samples/sec) 5938.5340 | GPU 792.3 MB
Epoch 00046 | Step 00080 | Loss 0.4067 | Train Acc 0.8809 | Speed (samples/sec) 5939.5502 | GPU 792.3 MB
Epoch 00046 | Step 00100 | Loss 0.4251 | Train Acc 0.8760 | Speed (samples/sec) 5939.9162 | GPU 792.3 MB
Epoch 00046 | Step 00120 | Loss 0.3999 | Train Acc 0.8838 | Speed (samples/sec) 5940.3261 | GPU 792.3 MB
Epoch 00046 | Step 00140 | Loss 0.4475 | Train Acc 0.8789 | Speed (samples/sec) 5941.0026 | GPU 792.3 MB
Epoch 00046 | Step 00160 | Loss 0.4180 | Train Acc 0.8867 | Speed (samples/sec) 5941.2900 | GPU 792.3 MB
Epoch 00046 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.7697


100%|██████████| 245/245 [00:39<00:00,  6.25it/s]
100%|██████████| 245/245 [00:50<00:00,  4.85it/s]
100%|██████████| 245/245 [00:51<00:00,  4.79it/s]


Val acc 0.8863, Test Acc: 0.7074
Best val acc 0.8863, best test acc: 0.7074
Epoch 00049 | Step 00000 | Loss 0.3805 | Train Acc 0.8906 | Speed (samples/sec) 5939.3450 | GPU 792.3 MB
Epoch 00049 | Step 00020 | Loss 0.3424 | Train Acc 0.8965 | Speed (samples/sec) 5938.9181 | GPU 792.3 MB
Epoch 00049 | Step 00040 | Loss 0.4212 | Train Acc 0.8760 | Speed (samples/sec) 5938.6383 | GPU 792.3 MB
Epoch 00049 | Step 00060 | Loss 0.3989 | Train Acc 0.8809 | Speed (samples/sec) 5938.2831 | GPU 792.3 MB
Epoch 00049 | Step 00080 | Loss 0.4668 | Train Acc 0.8555 | Speed (samples/sec) 5938.5465 | GPU 792.3 MB
Epoch 00049 | Step 00100 | Loss 0.4271 | Train Acc 0.8809 | Speed (samples/sec) 5938.3405 | GPU 792.3 MB
Epoch 00049 | Step 00120 | Loss 0.4044 | Train Acc 0.8838 | Speed (samples/sec) 5938.2036 | GPU 792.3 MB
Epoch 00049 | Step 00140 | Loss 0.3922 | Train Acc 0.8809 | Speed (samples/sec) 5938.5685 | GPU 792.3 MB
Epoch 00049 | Step 00160 | Loss 0.4372 | Train Acc 0.8770 | Speed (samples/sec) 5939

The experiment below shows that the eigenvectors must be scaled by the square root of their eigenvalues to achieve good performance. Without this scaling, the performance is worse.

In [5]:
# Ablation: train GraphSAGE on ogbn-products using the raw (unscaled)
# eigenvectors as the node input features.
g, num_labels = load_ogb('ogbn-products')
# Remove the node features stored on the graph; only the eigenvector-based
# features built below are handed to the model.
g.ndata.pop('features')

# Number of eigenpairs requested from get_eigen.
in_feats = 128
# The eigenvalues are returned as well but deliberately left unused here.
eigen_vals, eigen_vecs = get_eigen(g, in_feats, 'ogbn-products')
# The same graph object is used for training, validation and testing.
train_g = val_g = test_g = g
# Don't scale eigenvectors.
train_nfeat = val_nfeat = test_nfeat = th.tensor(eigen_vecs, dtype=th.float32)
train_labels = val_labels = test_labels = g.ndata.pop('labels')

hyperparams = {
    'batch_size': 1024,
    'num_workers': 4,
    'num_hidden': 256,
    'num_layers': 3,
    'dropout': 0.5,
    'lr': 0.003,
    'num_epochs': 50,
    'fanouts': [15,10,5],
    'eval_batch_size': 10000
}

# Prefer the second GPU (the device used for the recorded run), but fall back
# to the first GPU or the CPU so the cell still runs on smaller machines.
# NOTE(review): CPU execution depends on train_sample supporting it — confirm.
if th.cuda.device_count() > 1:
    device = th.device('cuda:1')
elif th.cuda.is_available():
    device = th.device('cuda:0')
else:
    device = th.device('cpu')

# Pack data
data = train_g, val_g, test_g, train_nfeat, train_labels, \
           val_nfeat, val_labels, test_nfeat, test_labels
# Define model
# The model input size is taken from the feature matrix actually built above.
in_feats = train_nfeat.shape[1]
model = SAGE(in_feats, hyperparams['num_hidden'], num_labels,
             hyperparams['num_layers'], F.relu, hyperparams['dropout'])
# NOTE(review): the trailing 3 is presumably the evaluation interval in
# epochs — confirm against train_eval.train_sample.
train_sample(model, data, hyperparams, device, 3)

load ogbn-products
finish loading ogbn-products
finish constructing ogbn-products
Epoch 00000 | Step 00000 | Loss 3.8492 | Train Acc 0.0391 | Speed (samples/sec) nan | GPU 792.3 MB
Epoch 00000 | Step 00020 | Loss 2.5491 | Train Acc 0.3066 | Speed (samples/sec) 5920.3537 | GPU 792.3 MB
Epoch 00000 | Step 00040 | Loss 2.5437 | Train Acc 0.2900 | Speed (samples/sec) 6031.4227 | GPU 792.3 MB
Epoch 00000 | Step 00060 | Loss 2.2843 | Train Acc 0.3301 | Speed (samples/sec) 5926.8878 | GPU 792.3 MB
Epoch 00000 | Step 00080 | Loss 2.0064 | Train Acc 0.4482 | Speed (samples/sec) 5861.9924 | GPU 792.3 MB
Epoch 00000 | Step 00100 | Loss 1.6505 | Train Acc 0.5488 | Speed (samples/sec) 5835.7202 | GPU 792.3 MB
Epoch 00000 | Step 00120 | Loss 1.4899 | Train Acc 0.6006 | Speed (samples/sec) 5788.7462 | GPU 792.3 MB
Epoch 00000 | Step 00140 | Loss 1.2912 | Train Acc 0.6475 | Speed (samples/sec) 5721.5846 | GPU 792.3 MB
Epoch 00000 | Step 00160 | Loss 1.1949 | Train Acc 0.6738 | Speed (samples/sec) 5729

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 38.2594


100%|██████████| 245/245 [00:41<00:00,  5.89it/s]
100%|██████████| 245/245 [00:51<00:00,  4.79it/s]
100%|██████████| 245/245 [00:51<00:00,  4.80it/s]


Val acc 0.7648, Test Acc: 0.5986
Best val acc 0.7648, best test acc: 0.5986
Epoch 00004 | Step 00000 | Loss 0.8630 | Train Acc 0.7627 | Speed (samples/sec) 5684.6560 | GPU 792.3 MB
Epoch 00004 | Step 00020 | Loss 0.7219 | Train Acc 0.7988 | Speed (samples/sec) 5690.6060 | GPU 792.3 MB
Epoch 00004 | Step 00040 | Loss 0.7355 | Train Acc 0.7988 | Speed (samples/sec) 5701.0012 | GPU 792.3 MB
Epoch 00004 | Step 00060 | Loss 0.7399 | Train Acc 0.7920 | Speed (samples/sec) 5709.0480 | GPU 792.3 MB
Epoch 00004 | Step 00080 | Loss 0.7502 | Train Acc 0.7783 | Speed (samples/sec) 5712.6029 | GPU 792.3 MB
Epoch 00004 | Step 00100 | Loss 0.6806 | Train Acc 0.8066 | Speed (samples/sec) 5722.7550 | GPU 792.3 MB
Epoch 00004 | Step 00120 | Loss 0.7247 | Train Acc 0.7959 | Speed (samples/sec) 5728.8752 | GPU 792.3 MB
Epoch 00004 | Step 00140 | Loss 0.7185 | Train Acc 0.8135 | Speed (samples/sec) 5733.8097 | GPU 792.3 MB
Epoch 00004 | Step 00160 | Loss 0.6016 | Train Acc 0.8457 | Speed (samples/sec) 5736

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.6953


100%|██████████| 245/245 [00:40<00:00,  6.04it/s]
100%|██████████| 245/245 [00:50<00:00,  4.86it/s]
100%|██████████| 245/245 [00:49<00:00,  4.90it/s]


Val acc 0.8105, Test Acc: 0.6464
Best val acc 0.8105, best test acc: 0.6464
Epoch 00007 | Step 00000 | Loss 0.6884 | Train Acc 0.8174 | Speed (samples/sec) 5787.9332 | GPU 792.3 MB
Epoch 00007 | Step 00020 | Loss 0.6162 | Train Acc 0.8359 | Speed (samples/sec) 5783.8225 | GPU 792.3 MB
Epoch 00007 | Step 00040 | Loss 0.6884 | Train Acc 0.8105 | Speed (samples/sec) 5787.6885 | GPU 792.3 MB
Epoch 00007 | Step 00060 | Loss 0.6162 | Train Acc 0.8252 | Speed (samples/sec) 5792.9322 | GPU 792.3 MB
Epoch 00007 | Step 00080 | Loss 0.6767 | Train Acc 0.8086 | Speed (samples/sec) 5798.6604 | GPU 792.3 MB
Epoch 00007 | Step 00100 | Loss 0.6376 | Train Acc 0.8164 | Speed (samples/sec) 5804.9585 | GPU 792.3 MB
Epoch 00007 | Step 00120 | Loss 0.6511 | Train Acc 0.8125 | Speed (samples/sec) 5806.1263 | GPU 792.3 MB
Epoch 00007 | Step 00140 | Loss 0.6869 | Train Acc 0.8066 | Speed (samples/sec) 5811.9025 | GPU 792.3 MB
Epoch 00007 | Step 00160 | Loss 0.6490 | Train Acc 0.8252 | Speed (samples/sec) 5816

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.3515


100%|██████████| 245/245 [00:40<00:00,  6.01it/s]
100%|██████████| 245/245 [00:51<00:00,  4.76it/s]
100%|██████████| 245/245 [00:50<00:00,  4.82it/s]


Val acc 0.8396, Test Acc: 0.6995
Best val acc 0.8396, best test acc: 0.6995
Epoch 00010 | Step 00000 | Loss 0.5972 | Train Acc 0.8330 | Speed (samples/sec) 5849.2357 | GPU 793.4 MB
Epoch 00010 | Step 00020 | Loss 0.6139 | Train Acc 0.8301 | Speed (samples/sec) 5845.9355 | GPU 793.4 MB
Epoch 00010 | Step 00040 | Loss 0.5536 | Train Acc 0.8369 | Speed (samples/sec) 5844.8828 | GPU 793.4 MB
Epoch 00010 | Step 00060 | Loss 0.6526 | Train Acc 0.8115 | Speed (samples/sec) 5845.1208 | GPU 793.4 MB
Epoch 00010 | Step 00080 | Loss 0.6168 | Train Acc 0.8174 | Speed (samples/sec) 5845.5274 | GPU 793.4 MB
Epoch 00010 | Step 00100 | Loss 0.6014 | Train Acc 0.8223 | Speed (samples/sec) 5845.5442 | GPU 793.4 MB
Epoch 00010 | Step 00120 | Loss 0.5646 | Train Acc 0.8398 | Speed (samples/sec) 5845.0011 | GPU 793.4 MB
Epoch 00010 | Step 00140 | Loss 0.6784 | Train Acc 0.8105 | Speed (samples/sec) 5846.6006 | GPU 793.4 MB
Epoch 00010 | Step 00160 | Loss 0.5653 | Train Acc 0.8311 | Speed (samples/sec) 5847

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 35.6829


100%|██████████| 245/245 [00:40<00:00,  6.03it/s]
100%|██████████| 245/245 [00:50<00:00,  4.83it/s]
100%|██████████| 245/245 [00:49<00:00,  4.98it/s]


Val acc 0.8167, Test Acc: 0.6601
Epoch 00013 | Step 00000 | Loss 0.6674 | Train Acc 0.8047 | Speed (samples/sec) 5880.2467 | GPU 793.4 MB
Epoch 00013 | Step 00020 | Loss 0.5327 | Train Acc 0.8525 | Speed (samples/sec) 5880.9835 | GPU 793.4 MB
Epoch 00013 | Step 00040 | Loss 0.5588 | Train Acc 0.8467 | Speed (samples/sec) 5881.3071 | GPU 793.4 MB
Epoch 00013 | Step 00060 | Loss 0.5363 | Train Acc 0.8428 | Speed (samples/sec) 5881.4215 | GPU 793.4 MB
Epoch 00013 | Step 00080 | Loss 0.5346 | Train Acc 0.8398 | Speed (samples/sec) 5881.0711 | GPU 793.4 MB
Epoch 00013 | Step 00100 | Loss 0.4943 | Train Acc 0.8604 | Speed (samples/sec) 5882.1066 | GPU 793.4 MB
Epoch 00013 | Step 00120 | Loss 0.5858 | Train Acc 0.8457 | Speed (samples/sec) 5882.2913 | GPU 793.4 MB
Epoch 00013 | Step 00140 | Loss 0.5727 | Train Acc 0.8359 | Speed (samples/sec) 5881.9124 | GPU 793.4 MB
Epoch 00013 | Step 00160 | Loss 0.5016 | Train Acc 0.8477 | Speed (samples/sec) 5881.2993 | GPU 793.4 MB
Epoch 00013 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.3120


100%|██████████| 245/245 [00:40<00:00,  6.05it/s]
100%|██████████| 245/245 [00:51<00:00,  4.75it/s]
100%|██████████| 245/245 [00:49<00:00,  4.92it/s]


Val acc 0.7441, Test Acc: 0.5948
Epoch 00016 | Step 00000 | Loss 1.0339 | Train Acc 0.7402 | Speed (samples/sec) 5873.7165 | GPU 793.4 MB
Epoch 00016 | Step 00020 | Loss 0.6036 | Train Acc 0.8311 | Speed (samples/sec) 5874.1890 | GPU 793.4 MB
Epoch 00016 | Step 00040 | Loss 0.5047 | Train Acc 0.8555 | Speed (samples/sec) 5875.3425 | GPU 793.4 MB
Epoch 00016 | Step 00060 | Loss 0.5483 | Train Acc 0.8496 | Speed (samples/sec) 5874.8266 | GPU 793.4 MB
Epoch 00016 | Step 00080 | Loss 0.5554 | Train Acc 0.8359 | Speed (samples/sec) 5875.7813 | GPU 793.4 MB
Epoch 00016 | Step 00100 | Loss 0.5795 | Train Acc 0.8242 | Speed (samples/sec) 5876.4488 | GPU 793.4 MB
Epoch 00016 | Step 00120 | Loss 0.5951 | Train Acc 0.8369 | Speed (samples/sec) 5876.6048 | GPU 793.4 MB
Epoch 00016 | Step 00140 | Loss 0.5812 | Train Acc 0.8359 | Speed (samples/sec) 5877.5858 | GPU 793.4 MB
Epoch 00016 | Step 00160 | Loss 0.6305 | Train Acc 0.8301 | Speed (samples/sec) 5878.8014 | GPU 793.4 MB
Epoch 00016 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.0399


100%|██████████| 245/245 [00:41<00:00,  5.90it/s]
100%|██████████| 245/245 [00:48<00:00,  5.06it/s]
100%|██████████| 245/245 [00:50<00:00,  4.88it/s]


Val acc 0.8342, Test Acc: 0.6845
Epoch 00019 | Step 00000 | Loss 0.5439 | Train Acc 0.8477 | Speed (samples/sec) 5883.0856 | GPU 793.4 MB
Epoch 00019 | Step 00020 | Loss 0.5371 | Train Acc 0.8418 | Speed (samples/sec) 5883.8895 | GPU 793.4 MB
Epoch 00019 | Step 00040 | Loss 0.5783 | Train Acc 0.8486 | Speed (samples/sec) 5883.8580 | GPU 793.4 MB
Epoch 00019 | Step 00060 | Loss 0.5424 | Train Acc 0.8389 | Speed (samples/sec) 5884.3116 | GPU 793.4 MB
Epoch 00019 | Step 00080 | Loss 0.4901 | Train Acc 0.8643 | Speed (samples/sec) 5885.0921 | GPU 793.4 MB
Epoch 00019 | Step 00100 | Loss 0.5804 | Train Acc 0.8379 | Speed (samples/sec) 5885.3696 | GPU 793.4 MB
Epoch 00019 | Step 00120 | Loss 0.5582 | Train Acc 0.8389 | Speed (samples/sec) 5886.5591 | GPU 793.4 MB
Epoch 00019 | Step 00140 | Loss 0.5069 | Train Acc 0.8750 | Speed (samples/sec) 5888.0592 | GPU 793.4 MB
Epoch 00019 | Step 00160 | Loss 0.5721 | Train Acc 0.8389 | Speed (samples/sec) 5888.0882 | GPU 793.4 MB
Epoch 00019 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.9199


100%|██████████| 245/245 [00:41<00:00,  5.93it/s]
100%|██████████| 245/245 [00:51<00:00,  4.71it/s]
100%|██████████| 245/245 [00:50<00:00,  4.90it/s]


Val acc 0.8182, Test Acc: 0.6575
Epoch 00022 | Step 00000 | Loss 0.6775 | Train Acc 0.7988 | Speed (samples/sec) 5889.8396 | GPU 793.4 MB
Epoch 00022 | Step 00020 | Loss 0.5580 | Train Acc 0.8408 | Speed (samples/sec) 5890.9054 | GPU 793.4 MB
Epoch 00022 | Step 00040 | Loss 0.5825 | Train Acc 0.8271 | Speed (samples/sec) 5892.0171 | GPU 793.4 MB
Epoch 00022 | Step 00060 | Loss 0.5173 | Train Acc 0.8623 | Speed (samples/sec) 5892.3774 | GPU 793.4 MB
Epoch 00022 | Step 00080 | Loss 0.5369 | Train Acc 0.8535 | Speed (samples/sec) 5892.1058 | GPU 793.4 MB
Epoch 00022 | Step 00100 | Loss 0.5091 | Train Acc 0.8496 | Speed (samples/sec) 5894.3851 | GPU 793.4 MB
Epoch 00022 | Step 00120 | Loss 0.5113 | Train Acc 0.8486 | Speed (samples/sec) 5895.8497 | GPU 793.4 MB
Epoch 00022 | Step 00140 | Loss 0.4908 | Train Acc 0.8525 | Speed (samples/sec) 5896.7390 | GPU 793.4 MB
Epoch 00022 | Step 00160 | Loss 0.5023 | Train Acc 0.8506 | Speed (samples/sec) 5897.6785 | GPU 793.4 MB
Epoch 00022 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.8023


100%|██████████| 245/245 [00:40<00:00,  6.02it/s]
100%|██████████| 245/245 [00:50<00:00,  4.85it/s]
100%|██████████| 245/245 [00:49<00:00,  4.96it/s]


Val acc 0.8392, Test Acc: 0.6922
Epoch 00025 | Step 00000 | Loss 0.5162 | Train Acc 0.8604 | Speed (samples/sec) 5905.3516 | GPU 793.4 MB
Epoch 00025 | Step 00020 | Loss 0.5258 | Train Acc 0.8643 | Speed (samples/sec) 5905.5916 | GPU 793.4 MB
Epoch 00025 | Step 00040 | Loss 0.5481 | Train Acc 0.8398 | Speed (samples/sec) 5905.8770 | GPU 793.4 MB
Epoch 00025 | Step 00060 | Loss 0.5412 | Train Acc 0.8291 | Speed (samples/sec) 5905.6284 | GPU 793.4 MB
Epoch 00025 | Step 00080 | Loss 0.5506 | Train Acc 0.8408 | Speed (samples/sec) 5906.5443 | GPU 793.4 MB
Epoch 00025 | Step 00100 | Loss 0.4937 | Train Acc 0.8496 | Speed (samples/sec) 5907.2090 | GPU 793.4 MB
Epoch 00025 | Step 00120 | Loss 0.4814 | Train Acc 0.8643 | Speed (samples/sec) 5907.5137 | GPU 793.4 MB
Epoch 00025 | Step 00140 | Loss 0.4975 | Train Acc 0.8516 | Speed (samples/sec) 5907.3937 | GPU 793.4 MB
Epoch 00025 | Step 00160 | Loss 0.4878 | Train Acc 0.8535 | Speed (samples/sec) 5907.5047 | GPU 793.4 MB
Epoch 00025 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.7262


100%|██████████| 245/245 [00:41<00:00,  5.94it/s]
100%|██████████| 245/245 [00:50<00:00,  4.86it/s]
100%|██████████| 245/245 [00:50<00:00,  4.85it/s]


Val acc 0.7752, Test Acc: 0.6237
Epoch 00028 | Step 00000 | Loss 0.8237 | Train Acc 0.7744 | Speed (samples/sec) 5902.3555 | GPU 793.4 MB
Epoch 00028 | Step 00020 | Loss 0.5735 | Train Acc 0.8467 | Speed (samples/sec) 5902.3605 | GPU 793.4 MB
Epoch 00028 | Step 00040 | Loss 0.5083 | Train Acc 0.8535 | Speed (samples/sec) 5903.8161 | GPU 793.4 MB
Epoch 00028 | Step 00060 | Loss 0.5350 | Train Acc 0.8418 | Speed (samples/sec) 5905.3371 | GPU 793.4 MB
Epoch 00028 | Step 00080 | Loss 0.5107 | Train Acc 0.8594 | Speed (samples/sec) 5906.4831 | GPU 793.4 MB
Epoch 00028 | Step 00100 | Loss 0.5378 | Train Acc 0.8477 | Speed (samples/sec) 5907.4068 | GPU 793.4 MB
Epoch 00028 | Step 00120 | Loss 0.4742 | Train Acc 0.8701 | Speed (samples/sec) 5908.1726 | GPU 793.4 MB
Epoch 00028 | Step 00140 | Loss 0.4938 | Train Acc 0.8643 | Speed (samples/sec) 5909.6665 | GPU 793.4 MB
Epoch 00028 | Step 00160 | Loss 0.4892 | Train Acc 0.8623 | Speed (samples/sec) 5910.2121 | GPU 793.4 MB
Epoch 00028 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.5472


100%|██████████| 245/245 [00:41<00:00,  5.94it/s]
100%|██████████| 245/245 [00:49<00:00,  4.91it/s]
100%|██████████| 245/245 [00:50<00:00,  4.89it/s]


Val acc 0.8368, Test Acc: 0.6884
Epoch 00031 | Step 00000 | Loss 0.5774 | Train Acc 0.8320 | Speed (samples/sec) 5915.6863 | GPU 793.5 MB
Epoch 00031 | Step 00020 | Loss 0.5012 | Train Acc 0.8584 | Speed (samples/sec) 5915.7557 | GPU 793.5 MB
Epoch 00031 | Step 00040 | Loss 0.4452 | Train Acc 0.8701 | Speed (samples/sec) 5914.9021 | GPU 793.5 MB
Epoch 00031 | Step 00060 | Loss 0.5066 | Train Acc 0.8564 | Speed (samples/sec) 5914.3876 | GPU 793.5 MB
Epoch 00031 | Step 00080 | Loss 0.5260 | Train Acc 0.8545 | Speed (samples/sec) 5914.9184 | GPU 793.5 MB
Epoch 00031 | Step 00100 | Loss 0.4634 | Train Acc 0.8652 | Speed (samples/sec) 5915.1267 | GPU 793.5 MB
Epoch 00031 | Step 00120 | Loss 0.5367 | Train Acc 0.8535 | Speed (samples/sec) 5915.0526 | GPU 793.5 MB
Epoch 00031 | Step 00140 | Loss 0.5078 | Train Acc 0.8525 | Speed (samples/sec) 5915.1658 | GPU 793.5 MB
Epoch 00031 | Step 00160 | Loss 0.4232 | Train Acc 0.8760 | Speed (samples/sec) 5915.6578 | GPU 793.5 MB
Epoch 00031 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.7671


100%|██████████| 245/245 [00:40<00:00,  6.01it/s]
100%|██████████| 245/245 [00:50<00:00,  4.85it/s]
100%|██████████| 245/245 [00:49<00:00,  4.98it/s]


Val acc 0.8498, Test Acc: 0.6983
Best val acc 0.8498, best test acc: 0.6983
Epoch 00034 | Step 00000 | Loss 0.5010 | Train Acc 0.8643 | Speed (samples/sec) 5914.2675 | GPU 793.5 MB
Epoch 00034 | Step 00020 | Loss 0.5700 | Train Acc 0.8320 | Speed (samples/sec) 5914.8286 | GPU 793.5 MB
Epoch 00034 | Step 00040 | Loss 0.4920 | Train Acc 0.8564 | Speed (samples/sec) 5915.3794 | GPU 793.5 MB
Epoch 00034 | Step 00060 | Loss 0.5404 | Train Acc 0.8398 | Speed (samples/sec) 5915.4919 | GPU 793.5 MB
Epoch 00034 | Step 00080 | Loss 0.5306 | Train Acc 0.8506 | Speed (samples/sec) 5915.3955 | GPU 793.5 MB
Epoch 00034 | Step 00100 | Loss 0.4910 | Train Acc 0.8643 | Speed (samples/sec) 5915.5709 | GPU 793.5 MB
Epoch 00034 | Step 00120 | Loss 0.4957 | Train Acc 0.8633 | Speed (samples/sec) 5916.1678 | GPU 793.5 MB
Epoch 00034 | Step 00140 | Loss 0.4791 | Train Acc 0.8613 | Speed (samples/sec) 5916.0245 | GPU 793.5 MB
Epoch 00034 | Step 00160 | Loss 0.5060 | Train Acc 0.8730 | Speed (samples/sec) 5915

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.2463


100%|██████████| 245/245 [00:40<00:00,  6.12it/s]
100%|██████████| 245/245 [00:49<00:00,  4.92it/s]
100%|██████████| 245/245 [00:48<00:00,  5.07it/s]


Val acc 0.7949, Test Acc: 0.6338
Epoch 00037 | Step 00000 | Loss 0.7432 | Train Acc 0.7959 | Speed (samples/sec) 5915.2410 | GPU 793.5 MB
Epoch 00037 | Step 00020 | Loss 0.5821 | Train Acc 0.8320 | Speed (samples/sec) 5915.0670 | GPU 793.5 MB
Epoch 00037 | Step 00040 | Loss 0.4984 | Train Acc 0.8486 | Speed (samples/sec) 5915.3179 | GPU 793.5 MB
Epoch 00037 | Step 00060 | Loss 0.5291 | Train Acc 0.8594 | Speed (samples/sec) 5914.9378 | GPU 793.5 MB
Epoch 00037 | Step 00080 | Loss 0.5022 | Train Acc 0.8643 | Speed (samples/sec) 5914.9526 | GPU 793.5 MB
Epoch 00037 | Step 00100 | Loss 0.4726 | Train Acc 0.8623 | Speed (samples/sec) 5914.7465 | GPU 793.5 MB
Epoch 00037 | Step 00120 | Loss 0.4861 | Train Acc 0.8584 | Speed (samples/sec) 5915.1767 | GPU 793.5 MB
Epoch 00037 | Step 00140 | Loss 0.5972 | Train Acc 0.8330 | Speed (samples/sec) 5915.3261 | GPU 793.5 MB
Epoch 00037 | Step 00160 | Loss 0.4734 | Train Acc 0.8525 | Speed (samples/sec) 5915.5258 | GPU 793.5 MB
Epoch 00037 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.3895


100%|██████████| 245/245 [00:41<00:00,  5.97it/s]
100%|██████████| 245/245 [00:49<00:00,  4.91it/s]
100%|██████████| 245/245 [00:51<00:00,  4.79it/s]


Val acc 0.8524, Test Acc: 0.7015
Best val acc 0.8524, best test acc: 0.7015
Epoch 00040 | Step 00000 | Loss 0.4976 | Train Acc 0.8457 | Speed (samples/sec) 5917.1799 | GPU 793.5 MB
Epoch 00040 | Step 00020 | Loss 0.4588 | Train Acc 0.8672 | Speed (samples/sec) 5916.8199 | GPU 793.5 MB
Epoch 00040 | Step 00040 | Loss 0.4963 | Train Acc 0.8584 | Speed (samples/sec) 5916.6979 | GPU 793.5 MB
Epoch 00040 | Step 00060 | Loss 0.4786 | Train Acc 0.8604 | Speed (samples/sec) 5916.9112 | GPU 793.5 MB
Epoch 00040 | Step 00080 | Loss 0.4949 | Train Acc 0.8506 | Speed (samples/sec) 5917.1283 | GPU 793.5 MB
Epoch 00040 | Step 00100 | Loss 0.4967 | Train Acc 0.8516 | Speed (samples/sec) 5916.9296 | GPU 793.5 MB
Epoch 00040 | Step 00120 | Loss 0.4997 | Train Acc 0.8613 | Speed (samples/sec) 5916.8854 | GPU 793.5 MB
Epoch 00040 | Step 00140 | Loss 0.5527 | Train Acc 0.8398 | Speed (samples/sec) 5917.2307 | GPU 793.5 MB
Epoch 00040 | Step 00160 | Loss 0.4512 | Train Acc 0.8672 | Speed (samples/sec) 5917

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 37.0849


100%|██████████| 245/245 [00:41<00:00,  5.92it/s]
100%|██████████| 245/245 [00:50<00:00,  4.88it/s]
100%|██████████| 245/245 [00:50<00:00,  4.84it/s]


Val acc 0.8650, Test Acc: 0.7015
Best val acc 0.8650, best test acc: 0.7015
Epoch 00043 | Step 00000 | Loss 0.5175 | Train Acc 0.8633 | Speed (samples/sec) 5911.2870 | GPU 793.5 MB
Epoch 00043 | Step 00020 | Loss 0.4789 | Train Acc 0.8613 | Speed (samples/sec) 5910.9740 | GPU 793.5 MB
Epoch 00043 | Step 00040 | Loss 0.5095 | Train Acc 0.8613 | Speed (samples/sec) 5910.7056 | GPU 793.5 MB
Epoch 00043 | Step 00060 | Loss 0.5084 | Train Acc 0.8574 | Speed (samples/sec) 5911.3015 | GPU 793.5 MB
Epoch 00043 | Step 00080 | Loss 0.4849 | Train Acc 0.8604 | Speed (samples/sec) 5911.4334 | GPU 793.5 MB
Epoch 00043 | Step 00100 | Loss 0.4813 | Train Acc 0.8604 | Speed (samples/sec) 5911.2419 | GPU 793.5 MB
Epoch 00043 | Step 00120 | Loss 0.4902 | Train Acc 0.8672 | Speed (samples/sec) 5912.0491 | GPU 793.5 MB
Epoch 00043 | Step 00140 | Loss 0.5131 | Train Acc 0.8633 | Speed (samples/sec) 5911.8833 | GPU 793.5 MB
Epoch 00043 | Step 00160 | Loss 0.5291 | Train Acc 0.8467 | Speed (samples/sec) 5912

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.4351


100%|██████████| 245/245 [00:41<00:00,  5.91it/s]
100%|██████████| 245/245 [00:48<00:00,  5.03it/s]
100%|██████████| 245/245 [00:48<00:00,  5.02it/s]


Val acc 0.8466, Test Acc: 0.6890
Epoch 00046 | Step 00000 | Loss 0.4957 | Train Acc 0.8447 | Speed (samples/sec) 5912.9835 | GPU 793.5 MB
Epoch 00046 | Step 00020 | Loss 0.4769 | Train Acc 0.8496 | Speed (samples/sec) 5913.1762 | GPU 793.5 MB
Epoch 00046 | Step 00040 | Loss 0.4341 | Train Acc 0.8750 | Speed (samples/sec) 5912.8257 | GPU 793.5 MB
Epoch 00046 | Step 00060 | Loss 0.4338 | Train Acc 0.8711 | Speed (samples/sec) 5912.8255 | GPU 793.5 MB
Epoch 00046 | Step 00080 | Loss 0.4515 | Train Acc 0.8721 | Speed (samples/sec) 5913.1611 | GPU 793.5 MB
Epoch 00046 | Step 00100 | Loss 0.4737 | Train Acc 0.8701 | Speed (samples/sec) 5913.5636 | GPU 793.5 MB
Epoch 00046 | Step 00120 | Loss 0.5422 | Train Acc 0.8555 | Speed (samples/sec) 5913.8796 | GPU 793.5 MB
Epoch 00046 | Step 00140 | Loss 0.4511 | Train Acc 0.8740 | Speed (samples/sec) 5914.0924 | GPU 793.5 MB
Epoch 00046 | Step 00160 | Loss 0.4875 | Train Acc 0.8584 | Speed (samples/sec) 5914.1689 | GPU 793.5 MB
Epoch 00046 | Step 001

  0%|          | 0/245 [00:00<?, ?it/s]

Epoch Time(s): 36.8791


100%|██████████| 245/245 [00:41<00:00,  5.97it/s]
100%|██████████| 245/245 [00:52<00:00,  4.68it/s]
100%|██████████| 245/245 [00:49<00:00,  4.99it/s]


Val acc 0.7696, Test Acc: 0.6354
Epoch 00049 | Step 00000 | Loss 1.0017 | Train Acc 0.7432 | Speed (samples/sec) 5913.9363 | GPU 793.5 MB
Epoch 00049 | Step 00020 | Loss 0.7232 | Train Acc 0.7900 | Speed (samples/sec) 5913.9449 | GPU 793.5 MB
Epoch 00049 | Step 00040 | Loss 0.5584 | Train Acc 0.8379 | Speed (samples/sec) 5914.0973 | GPU 793.5 MB
Epoch 00049 | Step 00060 | Loss 0.5969 | Train Acc 0.8447 | Speed (samples/sec) 5914.1447 | GPU 793.5 MB
Epoch 00049 | Step 00080 | Loss 0.5389 | Train Acc 0.8516 | Speed (samples/sec) 5914.2318 | GPU 793.5 MB
Epoch 00049 | Step 00100 | Loss 0.4937 | Train Acc 0.8633 | Speed (samples/sec) 5913.7983 | GPU 793.5 MB
Epoch 00049 | Step 00120 | Loss 0.5446 | Train Acc 0.8447 | Speed (samples/sec) 5913.8996 | GPU 793.5 MB
Epoch 00049 | Step 00140 | Loss 0.4961 | Train Acc 0.8525 | Speed (samples/sec) 5913.9018 | GPU 793.5 MB
Epoch 00049 | Step 00160 | Loss 0.5539 | Train Acc 0.8467 | Speed (samples/sec) 5913.9655 | GPU 793.5 MB
Epoch 00049 | Step 001