In [1]:
# One-time environment setup. The install commands below are intentionally left
# commented out; uncomment and run them only if the packages are missing.
# NOTE(review): consider `%pip install ...` with pinned versions so the install
# targets the kernel's own environment.
#!pip3 install tqdm
#!pip3 install git+https://git@github.com/SKTBrain/KoBERT.git@master
#!pip3 install seqeval
#!pip3 install kiwipiepy
#!pip3 install pymongo wikipedia koalanlp datasets thefuzz

In [2]:
import torch
from torch import nn
import torch.nn.functional as F
import torch.optim as optim
from torch.utils.data import Dataset, DataLoader
import numpy as np
import argparse
from tqdm.notebook import tqdm
from transformers import AdamW
from transformers.optimization import get_cosine_schedule_with_warmup

In [3]:
from data_loader import load_and_cache_examples
from utils import init_logger, load_tokenizer, set_seed, MODEL_CLASSES, MODEL_PATH_MAP
from trainer import Trainer

In [4]:
# Run configuration shared by the tokenizer loader, the dataset loader and the
# Trainer. It is assembled from themed groups; the merge order below reproduces
# the key order of a single flat dictionary.

# Task name plus input/output directories and file names.
_io_settings = {
    "task": "naver-ner",
    "model_dir": "./model_timex3_kobert",
    "data_dir": "./data/modeldata/",
    "pred_dir": "./preds_timex3_kobert",
    "train_file": "timex3.train",
    "test_file": "timex3.test",
    "val_file": "timex3.val",
    "label_file": "label.timex3",
    "write_pred": True,
}

# Model family selector and random seed.
_model_settings = {
    "model_type": "kobert",
    "seed": 42,
}

# Batch sizes, sequence length, optimisation and logging/saving cadence.
_training_settings = {
    "train_batch_size": 8,
    "eval_batch_size": 8,
    "max_seq_len": 100,
    "learning_rate": 5e-5,
    "num_train_epochs": 40.0,
    "weight_decay": 0.0,
    "gradient_accumulation_steps": 1,
    "adam_epsilon": 1e-8,
    "max_grad_norm": 1.0,
    "max_steps": -1,
    "warmup_steps": 0,
    "logging_steps": 1000,
    "save_steps": 1000,
}

# Switches that decide which stages of the notebook run.
_run_flags = {
    "do_train": True,
    "do_eval": True,
    "no_cuda": False,
}

args = {**_io_settings, **_model_settings, **_training_settings, **_run_flags}

# Look up the pretrained model path registered for the selected model type.
args["model_name_or_path"] = MODEL_PATH_MAP[args["model_type"]]

In [5]:
# Build the tokenizer from the run configuration; `load_tokenizer` is the
# project helper imported from `utils`.
tokenizer = load_tokenizer(args)

In [6]:
# Every split starts out unset; only the splits required by the run flags are
# loaded, always bypassing the on-disk cache (use_cache=False).
train_dataset = dev_dataset = test_dataset = None

# The test split is needed whenever the run trains or evaluates.
needs_test_split = args["do_train"] or args["do_eval"]
if needs_test_split:
    test_dataset = load_and_cache_examples(
        args, tokenizer, mode="test", use_cache=False
    )

# The train and dev splits are only needed for a training run.
if args["do_train"]:
    train_dataset = load_and_cache_examples(
        args, tokenizer, mode="train", use_cache=False
    )
    dev_dataset = load_and_cache_examples(
        args, tokenizer, mode="dev", use_cache=False
    )

In [7]:
# Construct the project Trainer from the run configuration and the three
# dataset splits; a split is None when the run flags did not request it.
trainer = Trainer(args, train_dataset, dev_dataset, test_dataset)

Some weights of BertForTokenClassification were not initialized from the model checkpoint at monologg/kobert and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
  return torch._C._cuda_getDeviceCount() > 0


In [8]:
# Run training only when the do_train flag is set in the configuration.
if args["do_train"]:
    trainer.train()

Epoch:   0%|                                             | 0/40 [00:00<?, ?it/s]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:50,  2.45s/it][A
Iteration:   4%|█▍                               | 2/46 [00:04<01:46,  2.43s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:43,  2.41s/it][A
Iteration:   9%|██▊                              | 4/46 [00:09<01:40,  2.39s/it][A
Iteration:  11%|███▌                             | 5/46 [00:11<01:37,  2.37s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:36,  2.41s/it][A
Iteration:  15%|█████                            | 7/46 [00:16<01:33,  2.41s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:31,  2.41s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:21<01:29,  2.42s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:28,  2.46s/it

Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:52,  2.50s/it][A
Iteration:   4%|█▍                               | 2/46 [00:04<01:48,  2.48s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:46,  2.48s/it][A
Iteration:   9%|██▊                              | 4/46 [00:09<01:43,  2.46s/it][A
Iteration:  11%|███▌                             | 5/46 [00:12<01:40,  2.44s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:39,  2.48s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:36,  2.48s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:34,  2.48s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.47s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:28,  2.45s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.48s

Iteration:   2%|▋                                | 1/46 [00:02<01:51,  2.49s/it][A
Iteration:   4%|█▍                               | 2/46 [00:04<01:49,  2.48s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:45,  2.46s/it][A
Iteration:   9%|██▊                              | 4/46 [00:09<01:42,  2.44s/it][A
Iteration:  11%|███▌                             | 5/46 [00:12<01:39,  2.44s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:38,  2.45s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:36,  2.48s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:35,  2.51s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.48s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:28,  2.46s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:25,  2.45s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.48s

Iteration:   4%|█▍                               | 2/46 [00:04<01:49,  2.48s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:45,  2.46s/it][A
Iteration:   9%|██▊                              | 4/46 [00:09<01:44,  2.48s/it][A
Iteration:  11%|███▌                             | 5/46 [00:12<01:40,  2.46s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:38,  2.47s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:36,  2.47s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:33,  2.46s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:33,  2.52s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:29,  2.49s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.48s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.49s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:21,  2.47s

Iteration:   7%|██▏                              | 3/46 [00:07<01:48,  2.51s/it][A
Iteration:   9%|██▊                              | 4/46 [00:10<01:44,  2.49s/it][A
Iteration:  11%|███▌                             | 5/46 [00:12<01:41,  2.49s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:39,  2.48s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:36,  2.48s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:33,  2.47s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.46s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:28,  2.45s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.47s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.48s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:21,  2.48s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:19,  2.48s

Iteration:   9%|██▊                              | 4/46 [00:09<01:42,  2.44s/it][A
Iteration:  11%|███▌                             | 5/46 [00:12<01:40,  2.45s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:39,  2.48s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:36,  2.47s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:34,  2.47s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:30,  2.46s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:28,  2.45s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.46s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.47s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:21,  2.48s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:19,  2.47s/it][A
Iteration:  33%|██████████▍                     | 15/46 [00:36<01:16,  2.47s

Iteration:  11%|███▌                             | 5/46 [00:12<01:41,  2.47s/it][A
Iteration:  13%|████▎                            | 6/46 [00:14<01:38,  2.47s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:35,  2.46s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:32,  2.45s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.47s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:29,  2.50s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:27,  2.50s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.50s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:22,  2.51s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:19,  2.50s/it][A
Iteration:  33%|██████████▍                     | 15/46 [00:37<01:18,  2.54s/it][A
Iteration:  35%|███████████▏                    | 16/46 [00:39<01:15,  2.52s

Iteration:  13%|████▎                            | 6/46 [00:14<01:39,  2.48s/it][A
Iteration:  15%|█████                            | 7/46 [00:17<01:36,  2.46s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:34,  2.48s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.48s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:29,  2.49s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.48s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.50s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:22,  2.49s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:19,  2.48s/it][A
Iteration:  33%|██████████▍                     | 15/46 [00:37<01:17,  2.49s/it][A
Iteration:  35%|███████████▏                    | 16/46 [00:39<01:14,  2.49s/it][A
Iteration:  37%|███████████▊                    | 17/46 [00:42<01:12,  2.49s

Iteration:  15%|█████                            | 7/46 [00:17<01:35,  2.45s/it][A
Iteration:  17%|█████▋                           | 8/46 [00:19<01:32,  2.44s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:30,  2.45s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:28,  2.46s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.47s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:24,  2.48s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:21,  2.47s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:18,  2.47s/it][A
Iteration:  33%|██████████▍                     | 15/46 [00:37<01:17,  2.49s/it][A
Iteration:  35%|███████████▏                    | 16/46 [00:39<01:15,  2.50s/it][A
Iteration:  37%|███████████▊                    | 17/46 [00:42<01:12,  2.49s/it][A
Iteration:  39%|████████████▌                   | 18/46 [00:44<01:09,  2.48s

Iteration:  17%|█████▋                           | 8/46 [00:19<01:33,  2.47s/it][A
Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.47s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:29,  2.48s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:26,  2.48s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:25,  2.52s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:22,  2.49s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:19,  2.48s/it][A
Iteration:  33%|██████████▍                     | 15/46 [00:37<01:17,  2.49s/it][A
Iteration:  35%|███████████▏                    | 16/46 [00:39<01:14,  2.49s/it][A
Iteration:  37%|███████████▊                    | 17/46 [00:42<01:12,  2.48s/it][A
Iteration:  39%|████████████▌                   | 18/46 [00:44<01:09,  2.47s/it][A
Iteration:  41%|█████████████▏                  | 19/46 [00:47<01:06,  2.48s

Iteration:  20%|██████▍                          | 9/46 [00:22<01:31,  2.48s/it][A
Iteration:  22%|██████▉                         | 10/46 [00:24<01:29,  2.49s/it][A
Iteration:  24%|███████▋                        | 11/46 [00:27<01:27,  2.49s/it][A
Iteration:  26%|████████▎                       | 12/46 [00:29<01:23,  2.47s/it][A
Iteration:  28%|█████████                       | 13/46 [00:32<01:21,  2.46s/it][A
Iteration:  30%|█████████▋                      | 14/46 [00:34<01:18,  2.45s/it][A
Iteration:  33%|██████████▍                     | 15/46 [00:37<01:16,  2.47s/it][A
Iteration:  35%|███████████▏                    | 16/46 [00:39<01:14,  2.48s/it][A
Iteration:  37%|███████████▊                    | 17/46 [00:41<01:11,  2.46s/it][A
Iteration:  39%|████████████▌                   | 18/46 [00:44<01:08,  2.45s/it][A
Iteration:  41%|█████████████▏                  | 19/46 [00:46<01:05,  2.44s/it][A
Iteration:  43%|█████████████▉                  | 20/46 [00:49<01:03,  2.45s

***** Eval results *****
  %s = %s f1 0.527027027027027
  %s = %s loss 0.19735990571124212
  %s = %s precision 0.5064935064935064
  %s = %s recall 0.5492957746478874



Iteration:  74%|███████████████████████▋        | 34/46 [01:28<00:46,  3.91s/it][A
Iteration:  76%|████████████████████████▎       | 35/46 [01:31<00:38,  3.48s/it][A
Iteration:  78%|█████████████████████████       | 36/46 [01:33<00:32,  3.20s/it][A
Iteration:  80%|█████████████████████████▋      | 37/46 [01:36<00:27,  3.02s/it][A
Iteration:  83%|██████████████████████████▍     | 38/46 [01:38<00:22,  2.84s/it][A
Iteration:  85%|███████████████████████████▏    | 39/46 [01:41<00:19,  2.73s/it][A
Iteration:  87%|███████████████████████████▊    | 40/46 [01:43<00:15,  2.66s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:46<00:13,  2.60s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:48<00:10,  2.56s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:51<00:07,  2.52s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:53<00:04,  2.49s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:56<00:02,  2.51

Iteration:  76%|████████████████████████▎       | 35/46 [01:26<00:27,  2.46s/it][A
Iteration:  78%|█████████████████████████       | 36/46 [01:28<00:24,  2.47s/it][A
Iteration:  80%|█████████████████████████▋      | 37/46 [01:31<00:22,  2.46s/it][A
Iteration:  83%|██████████████████████████▍     | 38/46 [01:33<00:19,  2.46s/it][A
Iteration:  85%|███████████████████████████▏    | 39/46 [01:36<00:17,  2.47s/it][A
Iteration:  87%|███████████████████████████▊    | 40/46 [01:38<00:14,  2.47s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:41<00:12,  2.46s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:43<00:09,  2.49s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.49s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:48<00:04,  2.48s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.51s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:52<00:00,  2.46s

Iteration:  78%|█████████████████████████       | 36/46 [01:29<00:24,  2.48s/it][A
Iteration:  80%|█████████████████████████▋      | 37/46 [01:31<00:22,  2.46s/it][A
Iteration:  83%|██████████████████████████▍     | 38/46 [01:34<00:19,  2.47s/it][A
Iteration:  85%|███████████████████████████▏    | 39/46 [01:36<00:17,  2.47s/it][A
Iteration:  87%|███████████████████████████▊    | 40/46 [01:38<00:14,  2.48s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:41<00:12,  2.47s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:43<00:09,  2.45s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.44s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:48<00:04,  2.46s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.47s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:52<00:00,  2.45s/it][A
Epoch:  65%|██████████████████████▊            | 26/40 [49:04<26:27, 113.36s

Iteration:  80%|█████████████████████████▋      | 37/46 [01:31<00:22,  2.46s/it][A
Iteration:  83%|██████████████████████████▍     | 38/46 [01:34<00:19,  2.48s/it][A
Iteration:  85%|███████████████████████████▏    | 39/46 [01:36<00:17,  2.49s/it][A
Iteration:  87%|███████████████████████████▊    | 40/46 [01:39<00:14,  2.48s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:41<00:12,  2.52s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:44<00:09,  2.49s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.49s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:49<00:04,  2.49s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.49s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:53<00:00,  2.46s/it][A
Epoch:  70%|████████████████████████▌          | 28/40 [52:51<22:39, 113.33s/it]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s

Iteration:  83%|██████████████████████████▍     | 38/46 [01:34<00:20,  2.53s/it][A
Iteration:  85%|███████████████████████████▏    | 39/46 [01:37<00:17,  2.53s/it][A
Iteration:  87%|███████████████████████████▊    | 40/46 [01:39<00:15,  2.50s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:41<00:12,  2.48s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:44<00:09,  2.47s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.47s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:49<00:04,  2.47s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.49s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:53<00:00,  2.47s/it][A
Epoch:  75%|██████████████████████████▎        | 30/40 [56:37<18:52, 113.27s/it]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:50,  2.45s/it

Iteration:  85%|███████████████████████████▏    | 39/46 [01:37<00:17,  2.49s/it][A
Iteration:  87%|███████████████████████████▊    | 40/46 [01:39<00:14,  2.48s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:42<00:12,  2.49s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:44<00:09,  2.48s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:47<00:07,  2.51s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:49<00:05,  2.50s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:52<00:02,  2.49s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:53<00:00,  2.47s/it][A
Epoch:  80%|██████████████████████████▍      | 32/40 [1:00:24<15:07, 113.38s/it]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:52,  2.49s/it][A
Iteration:   4%|█▍                               | 2/46 [00:04<01:49,  2.48s/it

Iteration:  87%|███████████████████████████▊    | 40/46 [01:39<00:14,  2.47s/it][A
Iteration:  89%|████████████████████████████▌   | 41/46 [01:41<00:12,  2.46s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:43<00:09,  2.48s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.48s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:49<00:05,  2.50s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.52s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:53<00:00,  2.46s/it][A
Epoch:  85%|████████████████████████████     | 34/40 [1:04:10<11:19, 113.21s/it]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:50,  2.45s/it][A
Iteration:   4%|█▍                               | 2/46 [00:05<01:51,  2.53s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:47,  2.51s/it

Iteration:  89%|████████████████████████████▌   | 41/46 [01:41<00:12,  2.45s/it][A
Iteration:  91%|█████████████████████████████▏  | 42/46 [01:43<00:09,  2.46s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.46s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:48<00:04,  2.46s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:50<00:02,  2.45s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:52<00:00,  2.45s/it][A
Epoch:  90%|█████████████████████████████▋   | 36/40 [1:07:56<07:32, 113.01s/it]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:53,  2.52s/it][A
Iteration:   4%|█▍                               | 2/46 [00:04<01:49,  2.48s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:47,  2.51s/it][A
Iteration:   9%|██▊                              | 4/46 [00:10<01:46,  2.54s/it

Iteration:  91%|█████████████████████████████▏  | 42/46 [01:44<00:09,  2.50s/it][A
Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.50s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:49<00:04,  2.48s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.46s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:53<00:00,  2.46s/it][A
Epoch:  95%|███████████████████████████████▎ | 38/40 [1:11:42<03:46, 113.13s/it]
Iteration:   0%|                                         | 0/46 [00:00<?, ?it/s][A
Iteration:   2%|▋                                | 1/46 [00:02<01:51,  2.48s/it][A
Iteration:   4%|█▍                               | 2/46 [00:04<01:48,  2.48s/it][A
Iteration:   7%|██▏                              | 3/46 [00:07<01:46,  2.48s/it][A
Iteration:   9%|██▊                              | 4/46 [00:09<01:44,  2.48s/it][A
Iteration:  11%|███▌                             | 5/46 [00:12<01:41,  2.48s/it

Iteration:  93%|█████████████████████████████▉  | 43/46 [01:46<00:07,  2.47s/it][A
Iteration:  96%|██████████████████████████████▌ | 44/46 [01:48<00:04,  2.45s/it][A
Iteration:  98%|███████████████████████████████▎| 45/46 [01:51<00:02,  2.45s/it][A
Iteration: 100%|████████████████████████████████| 46/46 [01:52<00:00,  2.45s/it][A
Epoch: 100%|█████████████████████████████████| 40/40 [1:15:28<00:00, 113.22s/it]


In [9]:
# Persist the model only when this run actually trained it. Saving
# unconditionally would, on an evaluation-only run (do_train=False), write the
# freshly constructed model to disk and the evaluation cell would then reload
# that instead of a previously fine-tuned checkpoint.
# NOTE(review): assumes save_model() writes to args["model_dir"] - confirm in trainer.py.
if args["do_train"]:
    trainer.save_model()

In [10]:
# Evaluation is gated on the do_eval flag in the configuration.
if args["do_eval"]:
    # NOTE(review): presumably reloads the checkpoint stored under
    # args["model_dir"] - confirm against Trainer.load_model.
    trainer.load_model()
    # NOTE(review): the first argument looks like the dataset split to score and
    # the second a label for the results - confirm against Trainer.evaluate.
    trainer.evaluate("test", "eval")

Evaluating: 100%|█████████████████████████████████| 7/7 [00:04<00:00,  1.49it/s]

***** Eval results *****
  %s = %s f1 0.5428571428571428
  %s = %s loss 0.21534028542893274
  %s = %s precision 0.5507246376811594
  %s = %s recall 0.5352112676056338



