In [1]:
# Enable IPython's autoreload extension so edits to imported project modules
# are picked up without restarting the kernel.
%load_ext autoreload
# Mode 2: reload all modules before each cell execution (per the IPython
# autoreload documentation).
%autoreload 2

In [2]:
import numpy as np
import tensorflow as tf

from model import SiameseNet
from data_utils import QuoraDataset, DataIterator
from config import Config
from embeddings import load_embeddings

Using TensorFlow backend.


In [3]:
### Loading config and pretrained GloVe embeddings
# Config() supplies the file paths and hyper-parameters read throughout the notebook.
config = Config()
# load_embeddings returns the embedding table plus a (word->index, index->word) pair.
# NOTE(review): the cell output ("Loading from saved word_embeddings") suggests a
# cached copy is read when present — confirm in embeddings.load_embeddings.
loaded_embeddings, (w2idx, idx2w) = load_embeddings(config.glove_filename, binary=False)

Loading from saved word_embeddings
Loading vocab


In [4]:
### Loading Quora Datasets
# Build the training dataset; its word<->index maps define the vocabulary
# whose size fixes the number of rows of the embedding matrix below.
qd_train = QuoraDataset(config.train_filename, save_path=config.train_save)
w2idx_train, idx2w_train = qd_train.w2idx, qd_train.idx2w

# Start every row from small Gaussian noise (std 0.001). A dedicated, seeded
# generator keeps this initialisation identical across kernel restarts, so a
# Restart & Run All produces the same starting embedding matrix every time.
EMBEDDING_INIT_SEED = 0
embedding_rng = np.random.RandomState(EMBEDDING_INIT_SEED)
embeddings = embedding_rng.normal(scale=0.001, size=(len(w2idx_train), config.we_dim))

In [5]:
# Overwrite the rows of `embeddings` with pre-trained vectors for every
# training-vocabulary word that also exists in the loaded embedding vocab.
for word, train_row in w2idx_train.items():
    pretrained_row = w2idx.get(word)
    if pretrained_row is None:
        # Word is absent from the pre-trained vocab: keep its initial row.
        continue
    embeddings[train_row] = loaded_embeddings[pretrained_row]

In [6]:
# Build the dev and test datasets, passing in the training word->index map
# instead of letting each split derive its own.
# NOTE(review): presumably this keeps all splits indexing into the same
# embedding matrix — confirm how QuoraDataset uses `w2idx` in data_utils.
qd_dev  = QuoraDataset(config.dev_filename, w2idx=w2idx_train, save_path=config.dev_save)
qd_test = QuoraDataset(config.test_filename, w2idx=w2idx_train, save_path=config.test_save)

In [7]:
# Pull the data out of each dataset object; these three values are what
# model.train() receives further down.
train_data = qd_train.data()
dev_data = qd_dev.data()
test_data = qd_test.data()

In [8]:
### SiameseNet
# Instantiate the network with the config and the prepared embedding matrix,
# then call build() before training.
# NOTE(review): build() presumably constructs the TensorFlow graph — confirm in model.py.
model = SiameseNet(config, embeddings)
model.build()

In [9]:
# Run training. Per the logged output below, dev and test accuracy are printed
# periodically within each epoch, and "New best score on dev !" appears after
# some epochs.
# NOTE(review): how test_data is used inside train() is not visible here —
# confirm it is only evaluated for reporting and never drives model selection.
model.train(train_data, dev_data, test_data)

  0%|          | 0/6005 [00:00<?, ?it/s]

Training in hid-256_lr-adam-0.001-tanh_bs-64_drop-0.0_tremb-0_nep-20/
Epoch 1/20 :
dev acc 62.16


  0%|          | 3/6005 [00:06<7:20:19,  4.40s/it] 

test acc 62.48


 17%|█▋        | 999/6005 [01:06<04:48, 17.38it/s] 

dev acc 80.08


 17%|█▋        | 1003/6005 [01:12<54:58,  1.52it/s]  

test acc 79.50


 33%|███▎      | 1999/6005 [02:10<03:50, 17.38it/s]

dev acc 81.43


 33%|███▎      | 2003/6005 [02:16<44:03,  1.51it/s]  

test acc 81.35


 50%|████▉     | 2999/6005 [03:18<03:06, 16.11it/s]

dev acc 81.92


 50%|█████     | 3003/6005 [03:24<33:20,  1.50it/s]

test acc 82.29


 67%|██████▋   | 3999/6005 [04:22<01:59, 16.82it/s]

dev acc 83.02


 67%|██████▋   | 4003/6005 [04:28<22:09,  1.51it/s]

test acc 83.03


 83%|████████▎ | 4999/6005 [05:27<00:57, 17.38it/s]

dev acc 83.63


 83%|████████▎ | 5003/6005 [05:33<11:04,  1.51it/s]

test acc 83.41


100%|█████████▉| 5999/6005 [06:32<00:00, 16.86it/s]

dev acc 83.86


100%|█████████▉| 6003/6005 [06:38<00:01,  1.51it/s]

test acc 83.96


100%|██████████| 6005/6005 [06:38<00:00,  2.06it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 2/20 :
dev acc 83.75


  0%|          | 3/6005 [00:05<6:49:39,  4.10s/it]

test acc 83.56


 17%|█▋        | 999/6005 [01:04<04:53, 17.07it/s] 

dev acc 84.18


 17%|█▋        | 1003/6005 [01:10<55:34,  1.50it/s]  

test acc 84.13


 33%|███▎      | 1999/6005 [02:11<03:56, 16.96it/s]

dev acc 84.37


 33%|███▎      | 2003/6005 [02:17<44:14,  1.51it/s]  

test acc 84.23


 50%|████▉     | 2999/6005 [03:16<02:56, 17.04it/s]

dev acc 84.47


 50%|█████     | 3003/6005 [03:22<33:14,  1.51it/s]

test acc 84.76


 67%|██████▋   | 3999/6005 [04:21<01:57, 17.14it/s]

dev acc 85.15


 67%|██████▋   | 4003/6005 [04:27<22:06,  1.51it/s]

test acc 85.05


 83%|████████▎ | 4999/6005 [05:26<00:59, 17.01it/s]

dev acc 85.14


 83%|████████▎ | 5003/6005 [05:32<11:04,  1.51it/s]

test acc 84.92


100%|█████████▉| 5999/6005 [06:32<00:00, 17.13it/s]

dev acc 85.36


100%|█████████▉| 6003/6005 [06:38<00:01,  1.51it/s]

test acc 85.07


100%|██████████| 6005/6005 [06:38<00:00,  2.07it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 3/20 :
dev acc 85.29


  0%|          | 3/6005 [00:05<6:49:18,  4.09s/it]

test acc 84.80


 17%|█▋        | 999/6005 [01:06<04:56, 16.89it/s] 

dev acc 86.03


 17%|█▋        | 1003/6005 [01:12<55:19,  1.51it/s]  

test acc 85.63


 33%|███▎      | 1999/6005 [02:11<03:53, 17.15it/s]

dev acc 85.78


 33%|███▎      | 2003/6005 [02:17<44:13,  1.51it/s]  

test acc 85.16


 50%|████▉     | 2999/6005 [03:16<02:51, 17.49it/s]

dev acc 85.81


 50%|█████     | 3003/6005 [03:22<33:05,  1.51it/s]

test acc 85.45


 67%|██████▋   | 3999/6005 [04:23<02:03, 16.18it/s]

dev acc 85.98


 67%|██████▋   | 4003/6005 [04:29<22:11,  1.50it/s]

test acc 85.14


 83%|████████▎ | 4999/6005 [05:28<00:59, 16.94it/s]

dev acc 85.64


 83%|████████▎ | 5003/6005 [05:34<11:13,  1.49it/s]

test acc 85.57


100%|█████████▉| 5999/6005 [06:33<00:00, 16.89it/s]

dev acc 85.95


100%|█████████▉| 6003/6005 [06:39<00:01,  1.51it/s]

test acc 85.24


100%|██████████| 6005/6005 [06:39<00:00,  2.07it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 4/20 :
dev acc 85.83


  0%|          | 3/6005 [00:05<6:50:37,  4.10s/it]

test acc 84.90


 17%|█▋        | 999/6005 [01:06<05:07, 16.30it/s] 

dev acc 86.46


 17%|█▋        | 1003/6005 [01:12<55:22,  1.51it/s]  

test acc 85.67


 33%|███▎      | 1999/6005 [02:11<03:56, 16.95it/s]

dev acc 86.18


 33%|███▎      | 2003/6005 [02:17<44:13,  1.51it/s]  

test acc 85.55


 50%|████▉     | 2999/6005 [03:15<02:57, 16.92it/s]

dev acc 86.19


 50%|█████     | 3003/6005 [03:21<33:34,  1.49it/s]

test acc 85.64


 67%|██████▋   | 3999/6005 [04:19<01:54, 17.55it/s]

dev acc 85.91


 67%|██████▋   | 4003/6005 [04:25<22:26,  1.49it/s]

test acc 84.80


 83%|████████▎ | 4999/6005 [05:22<00:58, 17.32it/s]

dev acc 85.66


 83%|████████▎ | 5003/6005 [05:28<11:11,  1.49it/s]

test acc 85.13


100%|█████████▉| 5999/6005 [06:25<00:00, 17.27it/s]

dev acc 86.13


100%|█████████▉| 6003/6005 [06:31<00:01,  1.50it/s]

test acc 85.16


100%|██████████| 6005/6005 [06:31<00:00,  2.06it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 5/20 :
dev acc 86.15


  0%|          | 3/6005 [00:05<6:53:16,  4.13s/it]

test acc 85.15


 17%|█▋        | 999/6005 [01:03<04:53, 17.05it/s] 

dev acc 86.73


 17%|█▋        | 1003/6005 [01:09<55:41,  1.50it/s]  

test acc 85.74


 33%|███▎      | 1999/6005 [02:06<03:52, 17.24it/s]

dev acc 86.56


 33%|███▎      | 2003/6005 [02:12<44:39,  1.49it/s]  

test acc 85.43


 50%|████▉     | 2999/6005 [03:09<03:01, 16.57it/s]

dev acc 86.50


 50%|█████     | 3003/6005 [03:15<33:26,  1.50it/s]

test acc 85.60


 67%|██████▋   | 3999/6005 [04:13<01:57, 17.11it/s]

dev acc 85.78


 67%|██████▋   | 4003/6005 [04:19<22:20,  1.49it/s]

test acc 85.28


 83%|████████▎ | 4999/6005 [05:16<00:58, 17.22it/s]

dev acc 86.19


 83%|████████▎ | 5003/6005 [05:22<11:11,  1.49it/s]

test acc 85.54


100%|█████████▉| 5999/6005 [06:20<00:00, 17.55it/s]

dev acc 86.04


100%|█████████▉| 6003/6005 [06:26<00:01,  1.49it/s]

test acc 85.36


100%|██████████| 6005/6005 [06:26<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 6/20 :
dev acc 86.16


  0%|          | 3/6005 [00:05<6:53:26,  4.13s/it]

test acc 85.46


 17%|█▋        | 999/6005 [01:03<04:52, 17.14it/s] 

dev acc 86.49


 17%|█▋        | 1003/6005 [01:09<55:43,  1.50it/s]  

test acc 85.38


 33%|███▎      | 1999/6005 [02:06<03:50, 17.40it/s]

dev acc 86.17


 33%|███▎      | 2003/6005 [02:12<44:29,  1.50it/s]  

test acc 85.35


 50%|████▉     | 2999/6005 [03:10<02:54, 17.20it/s]

dev acc 86.35


 50%|█████     | 3003/6005 [03:16<33:26,  1.50it/s]

test acc 85.57


 67%|██████▋   | 3999/6005 [04:13<01:56, 17.23it/s]

dev acc 85.69


 67%|██████▋   | 4003/6005 [04:19<22:28,  1.48it/s]

test acc 85.00


 83%|████████▎ | 4999/6005 [05:17<00:59, 16.93it/s]

dev acc 85.95


 83%|████████▎ | 5003/6005 [05:23<11:11,  1.49it/s]

test acc 85.08


100%|█████████▉| 5999/6005 [06:20<00:00, 17.09it/s]

dev acc 85.99


100%|█████████▉| 6003/6005 [06:26<00:01,  1.49it/s]

test acc 85.09


100%|██████████| 6005/6005 [06:26<00:00,  2.04it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 7/20 :
dev acc 86.57


  0%|          | 3/6005 [00:05<6:53:21,  4.13s/it]

test acc 85.54


 17%|█▋        | 999/6005 [01:07<05:21, 15.59it/s] 

dev acc 85.98


 17%|█▋        | 1003/6005 [01:14<57:26,  1.45it/s]  

test acc 85.17


 33%|███▎      | 1999/6005 [02:13<03:54, 17.09it/s]

dev acc 85.74


 33%|███▎      | 2003/6005 [02:19<44:28,  1.50it/s]  

test acc 85.18


 50%|████▉     | 2999/6005 [03:18<02:56, 17.01it/s]

dev acc 86.57


 50%|█████     | 3003/6005 [03:24<33:23,  1.50it/s]

test acc 85.69


 67%|██████▋   | 3999/6005 [04:23<02:02, 16.35it/s]

dev acc 84.20


 67%|██████▋   | 4003/6005 [04:29<22:12,  1.50it/s]

test acc 83.62


 83%|████████▎ | 4999/6005 [05:28<00:59, 17.03it/s]

dev acc 86.18


 83%|████████▎ | 5003/6005 [05:34<11:10,  1.49it/s]

test acc 85.21


100%|█████████▉| 5999/6005 [06:34<00:00, 17.32it/s]

dev acc 85.73


100%|█████████▉| 6003/6005 [06:40<00:01,  1.49it/s]

test acc 85.35


100%|██████████| 6005/6005 [06:40<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 8/20 :
dev acc 86.02


  0%|          | 3/6005 [00:06<6:53:55,  4.14s/it]

test acc 85.43


 17%|█▋        | 999/6005 [01:03<04:46, 17.48it/s] 

dev acc 86.28


 17%|█▋        | 1003/6005 [01:09<55:46,  1.49it/s]  

test acc 85.56


 33%|███▎      | 1999/6005 [02:06<03:51, 17.32it/s]

dev acc 86.58


 33%|███▎      | 2003/6005 [02:13<44:50,  1.49it/s]  

test acc 85.47


 50%|████▉     | 2999/6005 [03:10<02:56, 17.04it/s]

dev acc 86.77


 50%|█████     | 3003/6005 [03:16<33:41,  1.48it/s]

test acc 85.40


 67%|██████▋   | 3999/6005 [04:14<01:53, 17.66it/s]

dev acc 86.02


 67%|██████▋   | 4003/6005 [04:20<22:21,  1.49it/s]

test acc 85.25


 83%|████████▎ | 4999/6005 [05:17<00:57, 17.42it/s]

dev acc 86.74


 83%|████████▎ | 5003/6005 [05:23<11:08,  1.50it/s]

test acc 85.77


100%|█████████▉| 5999/6005 [06:20<00:00, 17.37it/s]

dev acc 86.37


100%|█████████▉| 6003/6005 [06:27<00:01,  1.49it/s]

test acc 85.67


100%|██████████| 6005/6005 [06:27<00:00,  2.06it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 9/20 :
dev acc 86.37


  0%|          | 3/6005 [00:06<6:54:45,  4.15s/it]

test acc 85.61


 17%|█▋        | 999/6005 [01:03<04:47, 17.43it/s] 

dev acc 86.37


 17%|█▋        | 1003/6005 [01:09<55:46,  1.49it/s]  

test acc 85.88


 33%|███▎      | 1999/6005 [02:07<04:03, 16.47it/s]

dev acc 86.81


 33%|███▎      | 2003/6005 [02:13<44:43,  1.49it/s]  

test acc 85.98


 50%|████▉     | 2999/6005 [03:10<02:53, 17.28it/s]

dev acc 86.53


 50%|█████     | 3003/6005 [03:16<33:36,  1.49it/s]

test acc 85.65


 67%|██████▋   | 3999/6005 [04:13<01:53, 17.60it/s]

dev acc 86.36


 67%|██████▋   | 4003/6005 [04:19<22:21,  1.49it/s]

test acc 85.73


 83%|████████▎ | 4999/6005 [05:17<00:58, 17.25it/s]

dev acc 86.64


 83%|████████▎ | 5003/6005 [05:23<11:10,  1.49it/s]

test acc 85.77


100%|█████████▉| 5999/6005 [06:20<00:00, 17.11it/s]

dev acc 86.65


100%|█████████▉| 6003/6005 [06:26<00:01,  1.49it/s]

test acc 85.96


100%|██████████| 6005/6005 [06:26<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 10/20 :
dev acc 86.73


  0%|          | 3/6005 [00:06<6:53:27,  4.13s/it]

test acc 85.92


 17%|█▋        | 999/6005 [01:03<04:45, 17.52it/s] 

dev acc 86.57


 17%|█▋        | 1003/6005 [01:09<55:42,  1.50it/s]  

test acc 85.93


 33%|███▎      | 1999/6005 [02:07<03:50, 17.39it/s]

dev acc 86.57


 33%|███▎      | 2003/6005 [02:13<44:37,  1.49it/s]  

test acc 86.01


 50%|████▉     | 2999/6005 [03:10<02:52, 17.42it/s]

dev acc 86.14


 50%|█████     | 3003/6005 [03:16<33:24,  1.50it/s]

test acc 85.13


 67%|██████▋   | 3999/6005 [04:13<01:54, 17.50it/s]

dev acc 86.83


 67%|██████▋   | 4003/6005 [04:20<22:26,  1.49it/s]

test acc 85.83


 83%|████████▎ | 4999/6005 [05:17<00:58, 17.29it/s]

dev acc 86.77


 83%|████████▎ | 5003/6005 [05:23<11:10,  1.49it/s]

test acc 85.85


100%|█████████▉| 5999/6005 [06:21<00:00, 17.40it/s]

dev acc 86.46


100%|█████████▉| 6003/6005 [06:27<00:01,  1.49it/s]

test acc 85.76


100%|██████████| 6005/6005 [06:27<00:00,  2.06it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 11/20 :
dev acc 86.55


  0%|          | 3/6005 [00:06<6:54:16,  4.14s/it]

test acc 85.96


 17%|█▋        | 999/6005 [01:03<04:47, 17.41it/s] 

dev acc 86.28


 17%|█▋        | 1003/6005 [01:09<55:37,  1.50it/s]  

test acc 85.85


 33%|███▎      | 1999/6005 [02:06<03:49, 17.48it/s]

dev acc 86.71


 33%|███▎      | 2003/6005 [02:13<44:42,  1.49it/s]  

test acc 86.28


 50%|████▉     | 2999/6005 [03:10<02:51, 17.53it/s]

dev acc 86.89


 50%|█████     | 3003/6005 [03:16<33:22,  1.50it/s]

test acc 86.16


 67%|██████▋   | 3999/6005 [04:13<01:54, 17.51it/s]

dev acc 86.70


 67%|██████▋   | 4003/6005 [04:19<22:22,  1.49it/s]

test acc 86.30


 83%|████████▎ | 4999/6005 [05:17<00:58, 17.22it/s]

dev acc 86.86


 83%|████████▎ | 5003/6005 [05:23<11:11,  1.49it/s]

test acc 86.07


100%|█████████▉| 5999/6005 [06:20<00:00, 17.43it/s]

dev acc 86.73


100%|█████████▉| 6003/6005 [06:26<00:01,  1.49it/s]

test acc 86.20


100%|██████████| 6005/6005 [06:27<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 12/20 :
dev acc 86.77


  0%|          | 3/6005 [00:05<6:53:22,  4.13s/it]

test acc 86.14


 17%|█▋        | 999/6005 [01:04<04:47, 17.41it/s] 

dev acc 86.67


 17%|█▋        | 1003/6005 [01:10<55:40,  1.50it/s]  

test acc 86.37


 33%|███▎      | 1999/6005 [02:08<03:48, 17.51it/s]

dev acc 86.65


 33%|███▎      | 2003/6005 [02:14<44:34,  1.50it/s]  

test acc 86.37


 50%|████▉     | 2999/6005 [03:11<02:50, 17.59it/s]

dev acc 86.79


 50%|█████     | 3003/6005 [03:17<33:21,  1.50it/s]

test acc 86.14


 67%|██████▋   | 3999/6005 [04:15<01:56, 17.15it/s]

dev acc 86.62


 67%|██████▋   | 4003/6005 [04:21<22:29,  1.48it/s]

test acc 86.34


 83%|████████▎ | 4999/6005 [05:18<00:57, 17.47it/s]

dev acc 86.82


 83%|████████▎ | 5003/6005 [05:24<11:11,  1.49it/s]

test acc 85.96


100%|█████████▉| 5999/6005 [06:22<00:00, 17.13it/s]

dev acc 86.88


100%|█████████▉| 6003/6005 [06:28<00:01,  1.49it/s]

test acc 86.44


100%|██████████| 6005/6005 [06:28<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 13/20 :
dev acc 86.80


  0%|          | 3/6005 [00:05<6:52:47,  4.13s/it]

test acc 86.32


 17%|█▋        | 999/6005 [01:03<04:55, 16.94it/s] 

dev acc 86.64


 17%|█▋        | 1003/6005 [01:09<55:44,  1.50it/s]  

test acc 86.00


 33%|███▎      | 1999/6005 [02:07<03:47, 17.63it/s]

dev acc 86.50


 33%|███▎      | 2003/6005 [02:13<44:39,  1.49it/s]  

test acc 86.04


 50%|████▉     | 2999/6005 [03:10<02:51, 17.51it/s]

dev acc 86.77


 50%|█████     | 3003/6005 [03:16<33:22,  1.50it/s]

test acc 85.89


 67%|██████▋   | 3999/6005 [04:13<01:55, 17.29it/s]

dev acc 86.90


 67%|██████▋   | 4003/6005 [04:20<22:26,  1.49it/s]

test acc 85.93


 83%|████████▎ | 4999/6005 [05:17<00:59, 17.02it/s]

dev acc 86.79


 83%|████████▎ | 5003/6005 [05:23<11:17,  1.48it/s]

test acc 85.77


100%|█████████▉| 5999/6005 [06:21<00:00, 17.03it/s]

dev acc 86.58


100%|█████████▉| 6003/6005 [06:27<00:01,  1.49it/s]

test acc 86.35


100%|██████████| 6005/6005 [06:27<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 14/20 :
dev acc 86.59


  0%|          | 3/6005 [00:06<6:53:52,  4.14s/it]

test acc 86.37


 17%|█▋        | 999/6005 [01:03<04:49, 17.32it/s] 

dev acc 86.43


 17%|█▋        | 1003/6005 [01:09<55:59,  1.49it/s]  

test acc 85.83


 33%|███▎      | 1999/6005 [02:07<03:49, 17.45it/s]

dev acc 86.58


 33%|███▎      | 2003/6005 [02:13<44:37,  1.49it/s]  

test acc 86.46


 50%|████▉     | 2999/6005 [03:10<02:50, 17.61it/s]

dev acc 86.68


 50%|█████     | 3003/6005 [03:16<33:26,  1.50it/s]

test acc 86.13


 67%|██████▋   | 3999/6005 [04:13<01:54, 17.48it/s]

dev acc 86.89


 67%|██████▋   | 4003/6005 [04:19<22:18,  1.50it/s]

test acc 86.01


 83%|████████▎ | 4999/6005 [05:17<00:58, 17.34it/s]

dev acc 86.99


 83%|████████▎ | 5003/6005 [05:23<11:10,  1.49it/s]

test acc 85.65


100%|█████████▉| 5999/6005 [06:20<00:00, 17.36it/s]

dev acc 86.79


100%|█████████▉| 6003/6005 [06:27<00:01,  1.48it/s]

test acc 86.12


100%|██████████| 6005/6005 [06:27<00:00,  2.03it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 15/20 :
dev acc 86.81


  0%|          | 3/6005 [00:06<6:54:17,  4.14s/it]

test acc 86.17


 17%|█▋        | 999/6005 [01:03<04:46, 17.48it/s] 

dev acc 86.86


 17%|█▋        | 1003/6005 [01:09<55:34,  1.50it/s]  

test acc 86.33


 33%|███▎      | 1999/6005 [02:06<03:48, 17.53it/s]

dev acc 86.66


 33%|███▎      | 2003/6005 [02:12<44:39,  1.49it/s]  

test acc 86.13


 50%|████▉     | 2999/6005 [03:10<02:53, 17.37it/s]

dev acc 87.00


 50%|█████     | 3003/6005 [03:16<33:33,  1.49it/s]

test acc 85.76


 67%|██████▋   | 3999/6005 [04:14<01:54, 17.59it/s]

dev acc 86.52


 67%|██████▋   | 4003/6005 [04:20<22:18,  1.50it/s]

test acc 85.88


 83%|████████▎ | 4999/6005 [05:17<00:57, 17.49it/s]

dev acc 87.03


 83%|████████▎ | 5003/6005 [05:23<11:10,  1.49it/s]

test acc 86.01


100%|█████████▉| 5999/6005 [06:21<00:00, 17.57it/s]

dev acc 86.68


100%|█████████▉| 6003/6005 [06:27<00:01,  1.49it/s]

test acc 86.04


100%|██████████| 6005/6005 [06:27<00:00,  2.05it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 16/20 :
dev acc 86.72


  0%|          | 3/6005 [00:06<6:54:17,  4.14s/it]

test acc 86.07


 17%|█▋        | 999/6005 [01:03<04:45, 17.56it/s] 

dev acc 86.90


 17%|█▋        | 1003/6005 [01:09<55:43,  1.50it/s]  

test acc 86.21


 33%|███▎      | 1999/6005 [02:06<03:51, 17.30it/s]

dev acc 86.66


 33%|███▎      | 2003/6005 [02:12<44:29,  1.50it/s]  

test acc 86.23


 50%|████▉     | 2999/6005 [03:10<02:53, 17.35it/s]

dev acc 86.75


 50%|█████     | 3003/6005 [03:16<33:22,  1.50it/s]

test acc 86.03


 67%|██████▋   | 3999/6005 [04:13<01:54, 17.54it/s]

dev acc 86.69


 67%|██████▋   | 4003/6005 [04:19<22:16,  1.50it/s]

test acc 86.17


 83%|████████▎ | 4999/6005 [05:17<00:57, 17.45it/s]

dev acc 86.81


 83%|████████▎ | 5003/6005 [05:23<11:11,  1.49it/s]

test acc 85.86


100%|█████████▉| 5999/6005 [06:21<00:00, 17.47it/s]

dev acc 86.60


100%|█████████▉| 6003/6005 [06:27<00:01,  1.50it/s]

test acc 86.13


100%|██████████| 6005/6005 [06:27<00:00,  2.07it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 17/20 :
dev acc 86.61


  0%|          | 3/6005 [00:06<6:57:03,  4.17s/it]

test acc 86.18


 17%|█▋        | 999/6005 [01:03<04:51, 17.19it/s] 

dev acc 86.81


 17%|█▋        | 1003/6005 [01:09<55:46,  1.49it/s]  

test acc 86.26


 33%|███▎      | 1999/6005 [02:06<03:50, 17.34it/s]

dev acc 86.75


 33%|███▎      | 2003/6005 [02:12<44:38,  1.49it/s]  

test acc 86.32


 50%|████▉     | 2999/6005 [03:10<02:50, 17.60it/s]

dev acc 86.86


 50%|█████     | 3003/6005 [03:16<33:25,  1.50it/s]

test acc 86.17


 67%|██████▋   | 3999/6005 [04:14<01:57, 17.08it/s]

dev acc 87.08


 67%|██████▋   | 4003/6005 [04:20<22:18,  1.50it/s]

test acc 86.39


 83%|████████▎ | 4999/6005 [05:17<00:57, 17.60it/s]

dev acc 87.04


 83%|████████▎ | 5003/6005 [05:23<11:10,  1.49it/s]

test acc 86.18


100%|█████████▉| 5999/6005 [06:21<00:00, 17.69it/s]

dev acc 87.08


100%|█████████▉| 6003/6005 [06:27<00:01,  1.50it/s]

test acc 86.33


100%|██████████| 6005/6005 [06:27<00:00,  2.06it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

New best score on dev !
Epoch 18/20 :
dev acc 87.00


  0%|          | 3/6005 [00:06<6:55:03,  4.15s/it]

test acc 86.39


 17%|█▋        | 999/6005 [01:03<04:48, 17.35it/s] 

dev acc 87.01


 17%|█▋        | 1003/6005 [01:09<55:45,  1.50it/s]  

test acc 86.29


 33%|███▎      | 1999/6005 [02:07<03:49, 17.42it/s]

dev acc 86.98


 33%|███▎      | 2003/6005 [02:13<44:40,  1.49it/s]  

test acc 86.29


 50%|████▉     | 2999/6005 [03:10<02:52, 17.47it/s]

dev acc 86.71


 50%|█████     | 3003/6005 [03:16<33:22,  1.50it/s]

test acc 86.11


 67%|██████▋   | 3999/6005 [04:14<01:56, 17.21it/s]

dev acc 86.79


 67%|██████▋   | 4003/6005 [04:20<22:10,  1.50it/s]

test acc 86.10


 83%|████████▎ | 4999/6005 [05:17<00:57, 17.47it/s]

dev acc 87.16


 83%|████████▎ | 5003/6005 [05:23<11:09,  1.50it/s]

test acc 86.08


100%|█████████▉| 5999/6005 [06:21<00:00, 17.61it/s]

dev acc 86.97


100%|█████████▉| 6003/6005 [06:27<00:01,  1.49it/s]

test acc 86.01


100%|██████████| 6005/6005 [06:27<00:00,  2.06it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 19/20 :
dev acc 86.95


  0%|          | 3/6005 [00:06<6:56:50,  4.17s/it]

test acc 86.05


 17%|█▋        | 999/6005 [01:09<04:56, 16.89it/s] 

dev acc 86.78


 17%|█▋        | 1003/6005 [01:15<56:21,  1.48it/s]  

test acc 86.02


 33%|███▎      | 1999/6005 [02:15<03:56, 16.92it/s]

dev acc 86.80


 33%|███▎      | 2003/6005 [02:22<44:27,  1.50it/s]  

test acc 86.26


 50%|████▉     | 2999/6005 [03:21<02:58, 16.81it/s]

dev acc 86.82


 50%|█████     | 3003/6005 [03:27<33:12,  1.51it/s]

test acc 86.35


 67%|██████▋   | 3999/6005 [04:27<02:04, 16.09it/s]

dev acc 86.87


 67%|██████▋   | 4003/6005 [04:34<23:20,  1.43it/s]

test acc 86.22


 83%|████████▎ | 4999/6005 [05:36<01:14, 13.43it/s]

dev acc 87.15


 83%|████████▎ | 5003/6005 [05:42<11:22,  1.47it/s]

test acc 86.31


100%|█████████▉| 5999/6005 [06:45<00:00, 16.20it/s]

dev acc 86.90


100%|█████████▉| 6003/6005 [06:52<00:01,  1.39it/s]

test acc 86.26


100%|██████████| 6005/6005 [06:52<00:00,  1.92it/s]
  0%|          | 0/6005 [00:00<?, ?it/s]

Epoch 20/20 :
dev acc 86.87


  0%|          | 3/6005 [00:06<7:59:30,  4.79s/it] 

test acc 86.27


 17%|█▋        | 999/6005 [01:10<05:36, 14.88it/s] 

dev acc 86.93


 17%|█▋        | 1003/6005 [01:17<1:03:02,  1.32it/s]

test acc 86.33


 33%|███▎      | 1999/6005 [02:20<04:28, 14.89it/s]  

dev acc 87.10


 33%|███▎      | 2003/6005 [02:27<48:17,  1.38it/s]  

test acc 86.14


 50%|████▉     | 2999/6005 [03:28<03:14, 15.43it/s]

dev acc 87.01


 50%|█████     | 3003/6005 [03:35<35:01,  1.43it/s]

test acc 86.28


 67%|██████▋   | 3999/6005 [04:36<02:00, 16.70it/s]

dev acc 86.89


 67%|██████▋   | 4003/6005 [04:42<22:30,  1.48it/s]

test acc 86.21


 83%|████████▎ | 4999/6005 [05:45<01:03, 15.84it/s]

dev acc 87.36


 83%|████████▎ | 5003/6005 [05:51<11:49,  1.41it/s]

test acc 86.10


100%|█████████▉| 5999/6005 [06:55<00:00, 14.46it/s]

dev acc 87.12


100%|█████████▉| 6003/6005 [07:02<00:01,  1.41it/s]

test acc 86.24


100%|██████████| 6005/6005 [07:02<00:00,  1.93it/s]


New best score on dev !
