In [1]:
from trainer import Trainer
from utils import init_logger, load_tokenizer, set_seed, MODEL_CLASSES, MODEL_PATH_MAP
from data_loader import load_and_cache_examples
import argparse

In [2]:
def _str2bool(value):
    """Convert a command-line token such as "true"/"false" into a real bool.

    ``type=bool`` is not usable with argparse: it calls ``bool()`` on the raw
    string, so every non-empty value -- including "False" and "0" -- is parsed
    as True. This converter accepts the usual spellings instead.

    Args:
        value: The raw option value (a string from the command line, or an
            actual bool, which is returned unchanged).

    Returns:
        True or False.

    Raises:
        argparse.ArgumentTypeError: If ``value`` is not a recognised boolean
            spelling; argparse reports this as a normal usage error.
    """
    if isinstance(value, bool):
        return value
    text = str(value).strip().lower()
    if text in ("true", "t", "yes", "y", "1"):
        return True
    if text in ("false", "f", "no", "n", "0"):
        return False
    raise argparse.ArgumentTypeError("Boolean value expected, got {!r}".format(value))


# Training configuration. Every option has a default, so the notebook runs
# without any command-line input; change a default here (or pass a list of
# tokens to parse_args below) to alter a run.
parser = argparse.ArgumentParser()

# Task and file locations.
parser.add_argument("--task", default="nsmc", type=str, help="The name of the task to train")
parser.add_argument("--model_dir", default="./model", type=str, help="Path to save, load model")
parser.add_argument("--data_dir", default="./data", type=str, help="The input data dir")
parser.add_argument("--train_file", default="ratings_train.txt", type=str, help="Train file")
parser.add_argument("--test_file", default="ratings_test.txt", type=str, help="Test file")

# Model selection; the valid choices are the keys of MODEL_CLASSES.
parser.add_argument("--model_type", default="kobert", type=str, help="Model type selected in the list: " + ", ".join(MODEL_CLASSES.keys()))

# Optimisation hyper-parameters.
# NOTE(review): set_seed and init_logger are imported in the first cell but are
# not called in any visible cell -- confirm whether seeding/logging setup was
# intended before training.
parser.add_argument("--seed", type=int, default=42, help="random seed for initialization")
parser.add_argument("--train_batch_size", default=32, type=int, help="Batch size for training.")
parser.add_argument("--eval_batch_size", default=64, type=int, help="Batch size for evaluation.")
parser.add_argument("--max_seq_len", default=50, type=int, help="The maximum total input sequence length after tokenization.")
parser.add_argument("--learning_rate", default=5e-5, type=float, help="The initial learning rate for Adam.")
parser.add_argument("--num_train_epochs", default=5.0, type=float, help="Total number of training epochs to perform.")
parser.add_argument("--weight_decay", default=0.0, type=float, help="Weight decay if we apply some.")
parser.add_argument("--gradient_accumulation_steps", type=int, default=1,
                    help="Number of updates steps to accumulate before performing a backward/update pass.")
parser.add_argument("--adam_epsilon", default=1e-8, type=float, help="Epsilon for Adam optimizer.")
parser.add_argument("--max_grad_norm", default=1.0, type=float, help="Max gradient norm.")
parser.add_argument("--max_steps", default=-1, type=int, help="If > 0: set total number of training steps to perform. Override num_train_epochs.")
parser.add_argument("--warmup_steps", default=0, type=int, help="Linear warmup over warmup_steps.")

# Logging / checkpoint cadence, counted in update steps.
parser.add_argument("--logging_steps", type=int, default=2000, help="Log every X updates steps.")
parser.add_argument("--save_steps", type=int, default=2000, help="Save checkpoint every X updates steps.")

# Boolean switches. They keep their "--flag VALUE" form and defaults, but are
# parsed with _str2bool so that "--do_train False" really yields False.
parser.add_argument("--do_train", type=_str2bool, default=True, help="Whether to run training.")
parser.add_argument("--do_eval", type=_str2bool, default=True, help="Whether to run eval on the test set.")
parser.add_argument("--no_cuda", type=_str2bool, default=False, help="Avoid using CUDA when available")

# Parse an explicit empty list so argparse does not read sys.argv (which, in a
# notebook, holds the kernel's own arguments); all options take their defaults.
args = parser.parse_args([])

# Attach the checkpoint identifier that corresponds to the chosen model type.
args.model_name_or_path = MODEL_PATH_MAP[args.model_type]

In [3]:
# Display the checkpoint identifier that the selected model type maps to
# (the same lookup the configuration cell stores in args.model_name_or_path).
MODEL_PATH_MAP[args.model_type]

'monologg/kobert'

## Load tokenizer, build dataset

In [4]:
# No separate validation split is loaded in this notebook; the trainer is
# handed None for it.
dev_dataset = None

# Build the tokenizer from the parsed configuration, then load the train and
# test splits with it (train first, then test, as tuple elements are evaluated
# left to right).
tokenizer = load_tokenizer(args)
train_dataset, test_dataset = (
    load_and_cache_examples(args, tokenizer, mode="train"),
    load_and_cache_examples(args, tokenizer, mode="test"),
)


The tokenizer class you load from this checkpoint is not the same type as the class this function is called from. It may result in unexpected tokenization. 
The tokenizer class you load from this checkpoint is 'BertTokenizer'. 
The class this function is called from is 'KoBertTokenizer'.


## Train

In [5]:
# Build the trainer from the parsed configuration and the three dataset
# splits (dev_dataset is None in this notebook).
trainer = Trainer(args, train_dataset, dev_dataset, test_dataset)

# Honour the --do_train switch declared in the configuration cell ("Whether to
# run training."); it defaults to True, so a default run still trains.
# NOTE(review): args.do_eval is not consulted in any visible cell; the
# "Evaluating" progress bars in the captured output suggest evaluation runs
# inside train() every logging_steps -- confirm against trainer.py.
if args.do_train:
    trainer.train()

Some weights of BertForSequenceClassification were not initialized from the model checkpoint at monologg/kobert and are newly initialized: ['classifier.weight', 'classifier.bias']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
Epoch:   0%|          | 0/5 [00:00<?, ?it/s]
Iteration:   0%|          | 0/4688 [00:00<?, ?it/s][A
Iteration:   0%|          | 1/4688 [00:00<15:28,  5.05it/s][A
Iteration:   0%|          | 2/4688 [00:00<14:04,  5.55it/s][A
Iteration:   0%|          | 3/4688 [00:00<13:33,  5.76it/s][A
Iteration:   0%|          | 4/4688 [00:00<13:20,  5.85it/s][A
Iteration:   0%|          | 5/4688 [00:00<13:14,  5.89it/s][A
Iteration:   0%|          | 6/4688 [00:01<13:10,  5.92it/s][A
Iteration:   0%|          | 7/4688 [00:01<13:08,  5.94it/s][A
Iteration:   0%|          | 8/4688 [00:01<13:06,  5.95it/s][A
Iteration:   0%|          | 9/4688 [00:01<13:05,  5.96it/s][A
Iteration:   0%|          | 10/4688 [00:01

Iteration:   3%|▎         | 122/4688 [00:20<12:52,  5.91it/s][A
Iteration:   3%|▎         | 123/4688 [00:20<12:49,  5.94it/s][A
Iteration:   3%|▎         | 124/4688 [00:20<12:49,  5.93it/s][A
Iteration:   3%|▎         | 125/4688 [00:21<12:49,  5.93it/s][A
Iteration:   3%|▎         | 126/4688 [00:21<12:49,  5.93it/s][A
Iteration:   3%|▎         | 127/4688 [00:21<12:48,  5.93it/s][A
Iteration:   3%|▎         | 128/4688 [00:21<12:49,  5.92it/s][A
Iteration:   3%|▎         | 129/4688 [00:21<12:50,  5.92it/s][A
Iteration:   3%|▎         | 130/4688 [00:21<12:51,  5.91it/s][A
Iteration:   3%|▎         | 131/4688 [00:22<12:51,  5.90it/s][A
Iteration:   3%|▎         | 132/4688 [00:22<12:52,  5.90it/s][A
Iteration:   3%|▎         | 133/4688 [00:22<12:52,  5.90it/s][A
Iteration:   3%|▎         | 134/4688 [00:22<12:52,  5.89it/s][A
Iteration:   3%|▎         | 135/4688 [00:22<12:48,  5.92it/s][A
Iteration:   3%|▎         | 136/4688 [00:22<12:50,  5.91it/s][A
Iteration:   3%|▎        

Iteration:   5%|▌         | 248/4688 [00:41<12:32,  5.90it/s][A
Iteration:   5%|▌         | 249/4688 [00:42<12:33,  5.89it/s][A
Iteration:   5%|▌         | 250/4688 [00:42<12:35,  5.87it/s][A
Iteration:   5%|▌         | 251/4688 [00:42<12:37,  5.86it/s][A
Iteration:   5%|▌         | 252/4688 [00:42<12:37,  5.86it/s][A
Iteration:   5%|▌         | 253/4688 [00:42<12:37,  5.86it/s][A
Iteration:   5%|▌         | 254/4688 [00:42<12:37,  5.85it/s][A
Iteration:   5%|▌         | 255/4688 [00:43<12:36,  5.86it/s][A
Iteration:   5%|▌         | 256/4688 [00:43<12:35,  5.86it/s][A
Iteration:   5%|▌         | 257/4688 [00:43<12:36,  5.86it/s][A
Iteration:   6%|▌         | 258/4688 [00:43<12:36,  5.86it/s][A
Iteration:   6%|▌         | 259/4688 [00:43<12:37,  5.85it/s][A
Iteration:   6%|▌         | 260/4688 [00:43<12:36,  5.86it/s][A
Iteration:   6%|▌         | 261/4688 [00:44<12:36,  5.85it/s][A
Iteration:   6%|▌         | 262/4688 [00:44<12:33,  5.88it/s][A
Iteration:   6%|▌        

Iteration:   8%|▊         | 374/4688 [01:03<12:25,  5.79it/s][A
Iteration:   8%|▊         | 375/4688 [01:03<12:24,  5.79it/s][A
Iteration:   8%|▊         | 376/4688 [01:03<12:22,  5.81it/s][A
Iteration:   8%|▊         | 377/4688 [01:04<12:22,  5.81it/s][A
Iteration:   8%|▊         | 378/4688 [01:04<12:22,  5.81it/s][A
Iteration:   8%|▊         | 379/4688 [01:04<12:21,  5.81it/s][A
Iteration:   8%|▊         | 380/4688 [01:04<12:20,  5.82it/s][A
Iteration:   8%|▊         | 381/4688 [01:04<12:16,  5.85it/s][A
Iteration:   8%|▊         | 382/4688 [01:04<12:18,  5.83it/s][A
Iteration:   8%|▊         | 383/4688 [01:05<12:19,  5.82it/s][A
Iteration:   8%|▊         | 384/4688 [01:05<12:19,  5.82it/s][A
Iteration:   8%|▊         | 385/4688 [01:05<12:19,  5.82it/s][A
Iteration:   8%|▊         | 386/4688 [01:05<12:19,  5.82it/s][A
Iteration:   8%|▊         | 387/4688 [01:05<12:14,  5.85it/s][A
Iteration:   8%|▊         | 388/4688 [01:05<12:16,  5.84it/s][A
Iteration:   8%|▊        

Iteration:  11%|█         | 500/4688 [01:25<11:58,  5.83it/s][A
Iteration:  11%|█         | 501/4688 [01:25<11:59,  5.82it/s][A
Iteration:  11%|█         | 502/4688 [01:25<12:00,  5.81it/s][A
Iteration:  11%|█         | 503/4688 [01:25<12:00,  5.81it/s][A
Iteration:  11%|█         | 504/4688 [01:25<11:56,  5.84it/s][A
Iteration:  11%|█         | 505/4688 [01:26<11:58,  5.83it/s][A
Iteration:  11%|█         | 506/4688 [01:26<11:54,  5.85it/s][A
Iteration:  11%|█         | 507/4688 [01:26<11:57,  5.83it/s][A
Iteration:  11%|█         | 508/4688 [01:26<11:54,  5.85it/s][A
Iteration:  11%|█         | 509/4688 [01:26<11:52,  5.86it/s][A
Iteration:  11%|█         | 510/4688 [01:26<11:55,  5.84it/s][A
Iteration:  11%|█         | 511/4688 [01:27<11:52,  5.86it/s][A
Iteration:  11%|█         | 512/4688 [01:27<11:55,  5.84it/s][A
Iteration:  11%|█         | 513/4688 [01:27<11:56,  5.83it/s][A
Iteration:  11%|█         | 514/4688 [01:27<11:57,  5.82it/s][A
Iteration:  11%|█        

Iteration:  13%|█▎        | 626/4688 [01:46<11:44,  5.77it/s][A
Iteration:  13%|█▎        | 627/4688 [01:47<11:44,  5.77it/s][A
Iteration:  13%|█▎        | 628/4688 [01:47<11:44,  5.76it/s][A
Iteration:  13%|█▎        | 629/4688 [01:47<11:44,  5.76it/s][A
Iteration:  13%|█▎        | 630/4688 [01:47<11:43,  5.76it/s][A
Iteration:  13%|█▎        | 631/4688 [01:47<11:39,  5.80it/s][A
Iteration:  13%|█▎        | 632/4688 [01:47<11:36,  5.82it/s][A
Iteration:  14%|█▎        | 633/4688 [01:48<11:38,  5.81it/s][A
Iteration:  14%|█▎        | 634/4688 [01:48<11:40,  5.79it/s][A
Iteration:  14%|█▎        | 635/4688 [01:48<11:40,  5.78it/s][A
Iteration:  14%|█▎        | 636/4688 [01:48<11:37,  5.81it/s][A
Iteration:  14%|█▎        | 637/4688 [01:48<11:38,  5.80it/s][A
Iteration:  14%|█▎        | 638/4688 [01:48<11:39,  5.79it/s][A
Iteration:  14%|█▎        | 639/4688 [01:49<11:41,  5.77it/s][A
Iteration:  14%|█▎        | 640/4688 [01:49<11:41,  5.77it/s][A
Iteration:  14%|█▎       

Iteration:  16%|█▌        | 752/4688 [02:08<11:30,  5.70it/s][A
Iteration:  16%|█▌        | 753/4688 [02:09<11:27,  5.72it/s][A
Iteration:  16%|█▌        | 754/4688 [02:09<11:26,  5.73it/s][A
Iteration:  16%|█▌        | 755/4688 [02:09<11:21,  5.77it/s][A
Iteration:  16%|█▌        | 756/4688 [02:09<11:22,  5.76it/s][A
Iteration:  16%|█▌        | 757/4688 [02:09<11:19,  5.78it/s][A
Iteration:  16%|█▌        | 758/4688 [02:09<11:17,  5.80it/s][A
Iteration:  16%|█▌        | 759/4688 [02:10<11:19,  5.78it/s][A
Iteration:  16%|█▌        | 760/4688 [02:10<11:20,  5.77it/s][A
Iteration:  16%|█▌        | 761/4688 [02:10<11:22,  5.76it/s][A
Iteration:  16%|█▋        | 762/4688 [02:10<11:19,  5.78it/s][A
Iteration:  16%|█▋        | 763/4688 [02:10<11:21,  5.76it/s][A
Iteration:  16%|█▋        | 764/4688 [02:10<11:22,  5.75it/s][A
Iteration:  16%|█▋        | 765/4688 [02:11<11:28,  5.69it/s][A
Iteration:  16%|█▋        | 766/4688 [02:11<11:30,  5.68it/s][A
Iteration:  16%|█▋       

Iteration:  19%|█▊        | 878/4688 [02:30<11:07,  5.71it/s][A
Iteration:  19%|█▉        | 879/4688 [02:31<11:06,  5.71it/s][A
Iteration:  19%|█▉        | 880/4688 [02:31<11:08,  5.69it/s][A
Iteration:  19%|█▉        | 881/4688 [02:31<11:04,  5.73it/s][A
Iteration:  19%|█▉        | 882/4688 [02:31<11:06,  5.71it/s][A
Iteration:  19%|█▉        | 883/4688 [02:31<11:12,  5.66it/s][A
Iteration:  19%|█▉        | 884/4688 [02:31<11:10,  5.67it/s][A
Iteration:  19%|█▉        | 885/4688 [02:32<11:07,  5.69it/s][A
Iteration:  19%|█▉        | 886/4688 [02:32<11:07,  5.69it/s][A
Iteration:  19%|█▉        | 887/4688 [02:32<11:04,  5.72it/s][A
Iteration:  19%|█▉        | 888/4688 [02:32<11:04,  5.72it/s][A
Iteration:  19%|█▉        | 889/4688 [02:32<11:02,  5.73it/s][A
Iteration:  19%|█▉        | 890/4688 [02:33<11:10,  5.66it/s][A
Iteration:  19%|█▉        | 891/4688 [02:33<11:12,  5.64it/s][A
Iteration:  19%|█▉        | 892/4688 [02:33<11:08,  5.68it/s][A
Iteration:  19%|█▉       

Iteration:  21%|██▏       | 1003/4688 [02:52<10:59,  5.59it/s][A
Iteration:  21%|██▏       | 1004/4688 [02:53<10:57,  5.60it/s][A
Iteration:  21%|██▏       | 1005/4688 [02:53<10:53,  5.64it/s][A
Iteration:  21%|██▏       | 1006/4688 [02:53<10:46,  5.69it/s][A
Iteration:  21%|██▏       | 1007/4688 [02:53<10:44,  5.71it/s][A
Iteration:  22%|██▏       | 1008/4688 [02:53<10:45,  5.71it/s][A
Iteration:  22%|██▏       | 1009/4688 [02:53<10:49,  5.66it/s][A
Iteration:  22%|██▏       | 1010/4688 [02:54<10:52,  5.63it/s][A
Iteration:  22%|██▏       | 1011/4688 [02:54<10:47,  5.68it/s][A
Iteration:  22%|██▏       | 1012/4688 [02:54<10:46,  5.69it/s][A
Iteration:  22%|██▏       | 1013/4688 [02:54<10:44,  5.70it/s][A
Iteration:  22%|██▏       | 1014/4688 [02:54<10:39,  5.75it/s][A
Iteration:  22%|██▏       | 1015/4688 [02:54<10:39,  5.74it/s][A
Iteration:  22%|██▏       | 1016/4688 [02:55<10:47,  5.67it/s][A
Iteration:  22%|██▏       | 1017/4688 [02:55<10:49,  5.65it/s][A
Iteration:

Iteration:  24%|██▍       | 1127/4688 [03:14<10:23,  5.71it/s][A
Iteration:  24%|██▍       | 1128/4688 [03:14<10:31,  5.64it/s][A
Iteration:  24%|██▍       | 1129/4688 [03:14<10:31,  5.64it/s][A
Iteration:  24%|██▍       | 1130/4688 [03:15<10:28,  5.66it/s][A
Iteration:  24%|██▍       | 1131/4688 [03:15<10:25,  5.68it/s][A
Iteration:  24%|██▍       | 1132/4688 [03:15<10:24,  5.69it/s][A
Iteration:  24%|██▍       | 1133/4688 [03:15<10:18,  5.75it/s][A
Iteration:  24%|██▍       | 1134/4688 [03:15<10:19,  5.74it/s][A
Iteration:  24%|██▍       | 1135/4688 [03:16<10:26,  5.68it/s][A
Iteration:  24%|██▍       | 1136/4688 [03:16<10:26,  5.67it/s][A
Iteration:  24%|██▍       | 1137/4688 [03:16<10:25,  5.68it/s][A
Iteration:  24%|██▍       | 1138/4688 [03:16<10:22,  5.70it/s][A
Iteration:  24%|██▍       | 1139/4688 [03:16<10:18,  5.74it/s][A
Iteration:  24%|██▍       | 1140/4688 [03:16<10:17,  5.75it/s][A
Iteration:  24%|██▍       | 1141/4688 [03:17<10:17,  5.75it/s][A
Iteration:

Iteration:  27%|██▋       | 1251/4688 [03:36<09:57,  5.75it/s][A
Iteration:  27%|██▋       | 1252/4688 [03:36<10:02,  5.70it/s][A
Iteration:  27%|██▋       | 1253/4688 [03:36<10:01,  5.71it/s][A
Iteration:  27%|██▋       | 1254/4688 [03:36<10:00,  5.72it/s][A
Iteration:  27%|██▋       | 1255/4688 [03:37<09:59,  5.72it/s][A
Iteration:  27%|██▋       | 1256/4688 [03:37<10:00,  5.71it/s][A
Iteration:  27%|██▋       | 1257/4688 [03:37<10:01,  5.70it/s][A
Iteration:  27%|██▋       | 1258/4688 [03:37<10:00,  5.71it/s][A
Iteration:  27%|██▋       | 1259/4688 [03:37<10:08,  5.64it/s][A
Iteration:  27%|██▋       | 1260/4688 [03:37<10:10,  5.62it/s][A
Iteration:  27%|██▋       | 1261/4688 [03:38<10:07,  5.64it/s][A
Iteration:  27%|██▋       | 1262/4688 [03:38<10:06,  5.65it/s][A
Iteration:  27%|██▋       | 1263/4688 [03:38<10:04,  5.66it/s][A
Iteration:  27%|██▋       | 1264/4688 [03:38<10:04,  5.67it/s][A
Iteration:  27%|██▋       | 1265/4688 [03:38<10:03,  5.67it/s][A
Iteration:

Iteration:  29%|██▉       | 1375/4688 [03:58<09:44,  5.67it/s][A
Iteration:  29%|██▉       | 1376/4688 [03:58<09:42,  5.68it/s][A
Iteration:  29%|██▉       | 1377/4688 [03:58<09:41,  5.70it/s][A
Iteration:  29%|██▉       | 1378/4688 [03:58<09:37,  5.73it/s][A
Iteration:  29%|██▉       | 1379/4688 [03:58<09:34,  5.76it/s][A
Iteration:  29%|██▉       | 1380/4688 [03:59<09:42,  5.68it/s][A
Iteration:  29%|██▉       | 1381/4688 [03:59<09:41,  5.69it/s][A
Iteration:  29%|██▉       | 1382/4688 [03:59<09:40,  5.70it/s][A
Iteration:  30%|██▉       | 1383/4688 [03:59<09:40,  5.69it/s][A
Iteration:  30%|██▉       | 1384/4688 [03:59<09:39,  5.70it/s][A
Iteration:  30%|██▉       | 1385/4688 [03:59<09:38,  5.71it/s][A
Iteration:  30%|██▉       | 1386/4688 [04:00<09:33,  5.76it/s][A
Iteration:  30%|██▉       | 1387/4688 [04:00<09:39,  5.69it/s][A
Iteration:  30%|██▉       | 1388/4688 [04:00<09:40,  5.68it/s][A
Iteration:  30%|██▉       | 1389/4688 [04:00<09:39,  5.69it/s][A
Iteration:

Iteration:  32%|███▏      | 1499/4688 [04:19<09:13,  5.76it/s][A
Iteration:  32%|███▏      | 1500/4688 [04:20<09:21,  5.68it/s][A
Iteration:  32%|███▏      | 1501/4688 [04:20<09:23,  5.66it/s][A
Iteration:  32%|███▏      | 1502/4688 [04:20<09:20,  5.68it/s][A
Iteration:  32%|███▏      | 1503/4688 [04:20<09:19,  5.70it/s][A
Iteration:  32%|███▏      | 1504/4688 [04:20<09:18,  5.70it/s][A
Iteration:  32%|███▏      | 1505/4688 [04:20<09:18,  5.70it/s][A
Iteration:  32%|███▏      | 1506/4688 [04:21<09:19,  5.69it/s][A
Iteration:  32%|███▏      | 1507/4688 [04:21<09:20,  5.67it/s][A
Iteration:  32%|███▏      | 1508/4688 [04:21<09:20,  5.67it/s][A
Iteration:  32%|███▏      | 1509/4688 [04:21<09:18,  5.69it/s][A
Iteration:  32%|███▏      | 1510/4688 [04:21<09:18,  5.69it/s][A
Iteration:  32%|███▏      | 1511/4688 [04:22<09:15,  5.72it/s][A
Iteration:  32%|███▏      | 1512/4688 [04:22<09:18,  5.69it/s][A
Iteration:  32%|███▏      | 1513/4688 [04:22<09:13,  5.73it/s][A
Iteration:

Iteration:  35%|███▍      | 1623/4688 [04:41<08:56,  5.72it/s][A
Iteration:  35%|███▍      | 1624/4688 [04:41<08:56,  5.71it/s][A
Iteration:  35%|███▍      | 1625/4688 [04:42<08:54,  5.73it/s][A
Iteration:  35%|███▍      | 1626/4688 [04:42<09:00,  5.67it/s][A
Iteration:  35%|███▍      | 1627/4688 [04:42<08:59,  5.67it/s][A
Iteration:  35%|███▍      | 1628/4688 [04:42<08:56,  5.71it/s][A
Iteration:  35%|███▍      | 1629/4688 [04:42<08:57,  5.69it/s][A
Iteration:  35%|███▍      | 1630/4688 [04:42<08:57,  5.68it/s][A
Iteration:  35%|███▍      | 1631/4688 [04:43<08:56,  5.69it/s][A
Iteration:  35%|███▍      | 1632/4688 [04:43<08:54,  5.72it/s][A
Iteration:  35%|███▍      | 1633/4688 [04:43<08:56,  5.69it/s][A
Iteration:  35%|███▍      | 1634/4688 [04:43<09:01,  5.64it/s][A
Iteration:  35%|███▍      | 1635/4688 [04:43<08:58,  5.67it/s][A
Iteration:  35%|███▍      | 1636/4688 [04:44<08:56,  5.68it/s][A
Iteration:  35%|███▍      | 1637/4688 [04:44<08:52,  5.73it/s][A
Iteration:

Iteration:  37%|███▋      | 1747/4688 [05:03<08:36,  5.69it/s][A
Iteration:  37%|███▋      | 1748/4688 [05:03<08:32,  5.74it/s][A
Iteration:  37%|███▋      | 1749/4688 [05:03<08:33,  5.72it/s][A
Iteration:  37%|███▋      | 1750/4688 [05:03<08:28,  5.78it/s][A
Iteration:  37%|███▋      | 1751/4688 [05:04<08:35,  5.69it/s][A
Iteration:  37%|███▋      | 1752/4688 [05:04<08:35,  5.70it/s][A
Iteration:  37%|███▋      | 1753/4688 [05:04<08:34,  5.70it/s][A
Iteration:  37%|███▋      | 1754/4688 [05:04<08:34,  5.71it/s][A
Iteration:  37%|███▋      | 1755/4688 [05:04<08:30,  5.74it/s][A
Iteration:  37%|███▋      | 1756/4688 [05:05<08:30,  5.74it/s][A
Iteration:  37%|███▋      | 1757/4688 [05:05<08:29,  5.75it/s][A
Iteration:  38%|███▊      | 1758/4688 [05:05<08:37,  5.66it/s][A
Iteration:  38%|███▊      | 1759/4688 [05:05<08:36,  5.67it/s][A
Iteration:  38%|███▊      | 1760/4688 [05:05<08:32,  5.71it/s][A
Iteration:  38%|███▊      | 1761/4688 [05:05<08:30,  5.74it/s][A
Iteration:

Iteration:  40%|███▉      | 1871/4688 [05:25<08:19,  5.64it/s][A
Iteration:  40%|███▉      | 1872/4688 [05:25<08:17,  5.66it/s][A
Iteration:  40%|███▉      | 1873/4688 [05:25<08:15,  5.68it/s][A
Iteration:  40%|███▉      | 1874/4688 [05:25<08:13,  5.70it/s][A
Iteration:  40%|███▉      | 1875/4688 [05:25<08:15,  5.68it/s][A
Iteration:  40%|████      | 1876/4688 [05:26<08:16,  5.66it/s][A
Iteration:  40%|████      | 1877/4688 [05:26<08:12,  5.71it/s][A
Iteration:  40%|████      | 1878/4688 [05:26<08:12,  5.70it/s][A
Iteration:  40%|████      | 1879/4688 [05:26<08:09,  5.74it/s][A
Iteration:  40%|████      | 1880/4688 [05:26<08:10,  5.73it/s][A
Iteration:  40%|████      | 1881/4688 [05:26<08:10,  5.72it/s][A
Iteration:  40%|████      | 1882/4688 [05:27<08:13,  5.69it/s][A
Iteration:  40%|████      | 1883/4688 [05:27<08:18,  5.62it/s][A
Iteration:  40%|████      | 1884/4688 [05:27<08:18,  5.62it/s][A
Iteration:  40%|████      | 1885/4688 [05:27<08:16,  5.65it/s][A
Iteration:

Iteration:  43%|████▎     | 1995/4688 [05:46<07:56,  5.66it/s][A
Iteration:  43%|████▎     | 1996/4688 [05:47<08:01,  5.59it/s][A
Iteration:  43%|████▎     | 1997/4688 [05:47<07:55,  5.65it/s][A
Iteration:  43%|████▎     | 1998/4688 [05:47<07:52,  5.69it/s][A
Iteration:  43%|████▎     | 1999/4688 [05:47<07:49,  5.72it/s][A

Evaluating:   0%|          | 0/782 [00:00<?, ?it/s][A[A

Evaluating:   0%|          | 2/782 [00:00<01:11, 10.89it/s][A[A

Evaluating:   1%|          | 4/782 [00:00<01:12, 10.69it/s][A[A

Evaluating:   1%|          | 6/782 [00:00<01:12, 10.64it/s][A[A

Evaluating:   1%|          | 8/782 [00:00<01:12, 10.61it/s][A[A

Evaluating:   1%|▏         | 10/782 [00:00<01:12, 10.61it/s][A[A

Evaluating:   2%|▏         | 12/782 [00:01<01:12, 10.60it/s][A[A

Evaluating:   2%|▏         | 14/782 [00:01<01:12, 10.60it/s][A[A

Evaluating:   2%|▏         | 16/782 [00:01<01:12, 10.59it/s][A[A

Evaluating:   2%|▏         | 18/782 [00:01<01:12, 10.60it/s][A[A

Ev

Evaluating:  29%|██▉       | 228/782 [00:21<00:52, 10.62it/s][A[A

Evaluating:  29%|██▉       | 230/782 [00:21<00:51, 10.62it/s][A[A

Evaluating:  30%|██▉       | 232/782 [00:21<00:51, 10.63it/s][A[A

Evaluating:  30%|██▉       | 234/782 [00:22<00:51, 10.63it/s][A[A

Evaluating:  30%|███       | 236/782 [00:22<00:51, 10.63it/s][A[A

Evaluating:  30%|███       | 238/782 [00:22<00:51, 10.63it/s][A[A

Evaluating:  31%|███       | 240/782 [00:22<00:51, 10.63it/s][A[A

Evaluating:  31%|███       | 242/782 [00:22<00:50, 10.62it/s][A[A

Evaluating:  31%|███       | 244/782 [00:22<00:50, 10.62it/s][A[A

Evaluating:  31%|███▏      | 246/782 [00:23<00:50, 10.63it/s][A[A

Evaluating:  32%|███▏      | 248/782 [00:23<00:50, 10.63it/s][A[A

Evaluating:  32%|███▏      | 250/782 [00:23<00:50, 10.62it/s][A[A

Evaluating:  32%|███▏      | 252/782 [00:23<00:49, 10.63it/s][A[A

Evaluating:  32%|███▏      | 254/782 [00:23<00:49, 10.63it/s][A[A

Evaluating:  33%|███▎      | 256/7

Evaluating:  59%|█████▉    | 464/782 [00:43<00:30, 10.59it/s][A[A

Evaluating:  60%|█████▉    | 466/782 [00:43<00:29, 10.58it/s][A[A

Evaluating:  60%|█████▉    | 468/782 [00:44<00:29, 10.58it/s][A[A

Evaluating:  60%|██████    | 470/782 [00:44<00:29, 10.58it/s][A[A

Evaluating:  60%|██████    | 472/782 [00:44<00:29, 10.59it/s][A[A

Evaluating:  61%|██████    | 474/782 [00:44<00:29, 10.60it/s][A[A

Evaluating:  61%|██████    | 476/782 [00:44<00:28, 10.61it/s][A[A

Evaluating:  61%|██████    | 478/782 [00:45<00:28, 10.61it/s][A[A

Evaluating:  61%|██████▏   | 480/782 [00:45<00:28, 10.61it/s][A[A

Evaluating:  62%|██████▏   | 482/782 [00:45<00:28, 10.61it/s][A[A

Evaluating:  62%|██████▏   | 484/782 [00:45<00:28, 10.62it/s][A[A

Evaluating:  62%|██████▏   | 486/782 [00:45<00:27, 10.62it/s][A[A

Evaluating:  62%|██████▏   | 488/782 [00:45<00:27, 10.62it/s][A[A

Evaluating:  63%|██████▎   | 490/782 [00:46<00:27, 10.62it/s][A[A

Evaluating:  63%|██████▎   | 492/7

Evaluating:  90%|████████▉ | 700/782 [01:05<00:07, 10.62it/s][A[A

Evaluating:  90%|████████▉ | 702/782 [01:06<00:07, 10.62it/s][A[A

Evaluating:  90%|█████████ | 704/782 [01:06<00:07, 10.62it/s][A[A

Evaluating:  90%|█████████ | 706/782 [01:06<00:07, 10.63it/s][A[A

Evaluating:  91%|█████████ | 708/782 [01:06<00:06, 10.63it/s][A[A

Evaluating:  91%|█████████ | 710/782 [01:06<00:06, 10.63it/s][A[A

Evaluating:  91%|█████████ | 712/782 [01:07<00:06, 10.63it/s][A[A

Evaluating:  91%|█████████▏| 714/782 [01:07<00:06, 10.62it/s][A[A

Evaluating:  92%|█████████▏| 716/782 [01:07<00:06, 10.62it/s][A[A

Evaluating:  92%|█████████▏| 718/782 [01:07<00:06, 10.62it/s][A[A

Evaluating:  92%|█████████▏| 720/782 [01:07<00:05, 10.62it/s][A[A

Evaluating:  92%|█████████▏| 722/782 [01:08<00:05, 10.62it/s][A[A

Evaluating:  93%|█████████▎| 724/782 [01:08<00:05, 10.62it/s][A[A

Evaluating:  93%|█████████▎| 726/782 [01:08<00:05, 10.62it/s][A[A

Evaluating:  93%|█████████▎| 728/7

Iteration:  44%|████▍     | 2079/4688 [07:16<07:38,  5.69it/s][A
Iteration:  44%|████▍     | 2080/4688 [07:16<07:35,  5.72it/s][A
Iteration:  44%|████▍     | 2081/4688 [07:16<07:35,  5.72it/s][A
Iteration:  44%|████▍     | 2082/4688 [07:16<07:32,  5.76it/s][A
Iteration:  44%|████▍     | 2083/4688 [07:17<07:38,  5.68it/s][A
Iteration:  44%|████▍     | 2084/4688 [07:17<07:37,  5.70it/s][A
Iteration:  44%|████▍     | 2085/4688 [07:17<07:37,  5.69it/s][A
Iteration:  44%|████▍     | 2086/4688 [07:17<07:36,  5.70it/s][A
Iteration:  45%|████▍     | 2087/4688 [07:17<07:36,  5.69it/s][A
Iteration:  45%|████▍     | 2088/4688 [07:17<07:34,  5.72it/s][A
Iteration:  45%|████▍     | 2089/4688 [07:18<07:35,  5.71it/s][A
Iteration:  45%|████▍     | 2090/4688 [07:18<07:38,  5.67it/s][A
Iteration:  45%|████▍     | 2091/4688 [07:18<07:43,  5.61it/s][A
Iteration:  45%|████▍     | 2092/4688 [07:18<07:43,  5.60it/s][A
Iteration:  45%|████▍     | 2093/4688 [07:18<07:38,  5.66it/s][A
Iteration:

Iteration:  47%|████▋     | 2203/4688 [07:38<07:17,  5.68it/s][A
Iteration:  47%|████▋     | 2204/4688 [07:38<07:13,  5.72it/s][A
Iteration:  47%|████▋     | 2205/4688 [07:38<07:12,  5.74it/s][A
Iteration:  47%|████▋     | 2206/4688 [07:38<07:13,  5.72it/s][A
Iteration:  47%|████▋     | 2207/4688 [07:38<07:15,  5.70it/s][A
Iteration:  47%|████▋     | 2208/4688 [07:39<07:20,  5.62it/s][A
Iteration:  47%|████▋     | 2209/4688 [07:39<07:24,  5.58it/s][A
Iteration:  47%|████▋     | 2210/4688 [07:39<07:20,  5.63it/s][A
Iteration:  47%|████▋     | 2211/4688 [07:39<07:19,  5.63it/s][A
Iteration:  47%|████▋     | 2212/4688 [07:39<07:17,  5.66it/s][A
Iteration:  47%|████▋     | 2213/4688 [07:39<07:13,  5.70it/s][A
Iteration:  47%|████▋     | 2214/4688 [07:40<07:10,  5.75it/s][A
Iteration:  47%|████▋     | 2215/4688 [07:40<07:10,  5.75it/s][A
Iteration:  47%|████▋     | 2216/4688 [07:40<07:09,  5.75it/s][A
Iteration:  47%|████▋     | 2217/4688 [07:40<07:09,  5.76it/s][A
Iteration:

Iteration:  50%|████▉     | 2327/4688 [07:59<06:54,  5.70it/s][A
Iteration:  50%|████▉     | 2328/4688 [08:00<06:54,  5.69it/s][A
Iteration:  50%|████▉     | 2329/4688 [08:00<06:54,  5.69it/s][A
Iteration:  50%|████▉     | 2330/4688 [08:00<06:54,  5.68it/s][A
Iteration:  50%|████▉     | 2331/4688 [08:00<06:51,  5.72it/s][A
Iteration:  50%|████▉     | 2332/4688 [08:00<06:49,  5.75it/s][A
Iteration:  50%|████▉     | 2333/4688 [08:00<06:48,  5.76it/s][A
Iteration:  50%|████▉     | 2334/4688 [08:01<06:55,  5.67it/s][A
Iteration:  50%|████▉     | 2335/4688 [08:01<06:54,  5.67it/s][A
Iteration:  50%|████▉     | 2336/4688 [08:01<06:51,  5.71it/s][A
Iteration:  50%|████▉     | 2337/4688 [08:01<06:50,  5.72it/s][A
Iteration:  50%|████▉     | 2338/4688 [08:01<06:52,  5.70it/s][A
Iteration:  50%|████▉     | 2339/4688 [08:01<06:51,  5.70it/s][A
Iteration:  50%|████▉     | 2340/4688 [08:02<06:50,  5.73it/s][A
Iteration:  50%|████▉     | 2341/4688 [08:02<06:56,  5.64it/s][A
Iteration:

Iteration:  52%|█████▏    | 2451/4688 [08:21<06:31,  5.71it/s][A
Iteration:  52%|█████▏    | 2452/4688 [08:21<06:31,  5.71it/s][A
Iteration:  52%|█████▏    | 2453/4688 [08:21<06:30,  5.72it/s][A
Iteration:  52%|█████▏    | 2454/4688 [08:22<06:28,  5.75it/s][A
Iteration:  52%|█████▏    | 2455/4688 [08:22<06:26,  5.78it/s][A
Iteration:  52%|█████▏    | 2456/4688 [08:22<06:24,  5.80it/s][A
Iteration:  52%|█████▏    | 2457/4688 [08:22<06:27,  5.75it/s][A
Iteration:  52%|█████▏    | 2458/4688 [08:22<06:30,  5.71it/s][A
Iteration:  52%|█████▏    | 2459/4688 [08:22<06:30,  5.71it/s][A
Iteration:  52%|█████▏    | 2460/4688 [08:23<06:29,  5.72it/s][A
Iteration:  52%|█████▏    | 2461/4688 [08:23<06:27,  5.75it/s][A
Iteration:  53%|█████▎    | 2462/4688 [08:23<06:25,  5.77it/s][A
Iteration:  53%|█████▎    | 2463/4688 [08:23<06:27,  5.75it/s][A
Iteration:  53%|█████▎    | 2464/4688 [08:23<06:29,  5.71it/s][A
Iteration:  53%|█████▎    | 2465/4688 [08:24<06:30,  5.70it/s][A
Iteration:

Iteration:  55%|█████▍    | 2575/4688 [08:43<06:12,  5.67it/s][A
Iteration:  55%|█████▍    | 2576/4688 [08:43<06:11,  5.69it/s][A
Iteration:  55%|█████▍    | 2577/4688 [08:43<06:10,  5.70it/s][A
Iteration:  55%|█████▍    | 2578/4688 [08:43<06:09,  5.72it/s][A
Iteration:  55%|█████▌    | 2579/4688 [08:44<06:06,  5.75it/s][A
Iteration:  55%|█████▌    | 2580/4688 [08:44<06:04,  5.78it/s][A
Iteration:  55%|█████▌    | 2581/4688 [08:44<06:06,  5.75it/s][A
Iteration:  55%|█████▌    | 2582/4688 [08:44<06:09,  5.70it/s][A
Iteration:  55%|█████▌    | 2583/4688 [08:44<06:08,  5.72it/s][A
Iteration:  55%|█████▌    | 2584/4688 [08:44<06:07,  5.72it/s][A
Iteration:  55%|█████▌    | 2585/4688 [08:45<06:07,  5.72it/s][A
Iteration:  55%|█████▌    | 2586/4688 [08:45<06:05,  5.75it/s][A
Iteration:  55%|█████▌    | 2587/4688 [08:45<06:06,  5.73it/s][A
Iteration:  55%|█████▌    | 2588/4688 [08:45<06:07,  5.72it/s][A
Iteration:  55%|█████▌    | 2589/4688 [08:45<06:08,  5.70it/s][A
Iteration:

Iteration:  58%|█████▊    | 2699/4688 [09:05<05:47,  5.73it/s][A
Iteration:  58%|█████▊    | 2700/4688 [09:05<05:49,  5.69it/s][A
Iteration:  58%|█████▊    | 2701/4688 [09:05<05:48,  5.70it/s][A
Iteration:  58%|█████▊    | 2702/4688 [09:05<05:48,  5.70it/s][A
Iteration:  58%|█████▊    | 2703/4688 [09:05<05:46,  5.73it/s][A
Iteration:  58%|█████▊    | 2704/4688 [09:05<05:45,  5.75it/s][A
Iteration:  58%|█████▊    | 2705/4688 [09:06<05:45,  5.74it/s][A
Iteration:  58%|█████▊    | 2706/4688 [09:06<05:50,  5.66it/s][A
Iteration:  58%|█████▊    | 2707/4688 [09:06<05:51,  5.64it/s][A
Iteration:  58%|█████▊    | 2708/4688 [09:06<05:49,  5.66it/s][A
Iteration:  58%|█████▊    | 2709/4688 [09:06<05:48,  5.68it/s][A
Iteration:  58%|█████▊    | 2710/4688 [09:06<05:45,  5.73it/s][A
Iteration:  58%|█████▊    | 2711/4688 [09:07<05:44,  5.74it/s][A
Iteration:  58%|█████▊    | 2712/4688 [09:07<05:43,  5.76it/s][A
Iteration:  58%|█████▊    | 2713/4688 [09:07<05:48,  5.67it/s][A
Iteration:

Iteration:  60%|██████    | 2823/4688 [09:26<05:28,  5.68it/s][A
Iteration:  60%|██████    | 2824/4688 [09:26<05:25,  5.72it/s][A
Iteration:  60%|██████    | 2825/4688 [09:27<05:27,  5.69it/s][A
Iteration:  60%|██████    | 2826/4688 [09:27<05:26,  5.71it/s][A
Iteration:  60%|██████    | 2827/4688 [09:27<05:24,  5.74it/s][A
Iteration:  60%|██████    | 2828/4688 [09:27<05:22,  5.76it/s][A
Iteration:  60%|██████    | 2829/4688 [09:27<05:24,  5.74it/s][A
Iteration:  60%|██████    | 2830/4688 [09:27<05:23,  5.73it/s][A
Iteration:  60%|██████    | 2831/4688 [09:28<05:22,  5.75it/s][A
Iteration:  60%|██████    | 2832/4688 [09:28<05:23,  5.74it/s][A
Iteration:  60%|██████    | 2833/4688 [09:28<05:21,  5.77it/s][A
Iteration:  60%|██████    | 2834/4688 [09:28<05:20,  5.78it/s][A
Iteration:  60%|██████    | 2835/4688 [09:28<05:19,  5.80it/s][A
Iteration:  60%|██████    | 2836/4688 [09:28<05:24,  5.70it/s][A
Iteration:  61%|██████    | 2837/4688 [09:29<05:26,  5.66it/s][A
Iteration:

Iteration:  63%|██████▎   | 2947/4688 [09:48<05:04,  5.72it/s][A
Iteration:  63%|██████▎   | 2948/4688 [09:48<05:03,  5.72it/s][A
Iteration:  63%|██████▎   | 2949/4688 [09:48<05:04,  5.72it/s][A
Iteration:  63%|██████▎   | 2950/4688 [09:48<05:02,  5.74it/s][A
Iteration:  63%|██████▎   | 2951/4688 [09:49<05:05,  5.68it/s][A
Iteration:  63%|██████▎   | 2952/4688 [09:49<05:09,  5.61it/s][A
Iteration:  63%|██████▎   | 2953/4688 [09:49<05:09,  5.61it/s][A
Iteration:  63%|██████▎   | 2954/4688 [09:49<05:07,  5.64it/s][A
Iteration:  63%|██████▎   | 2955/4688 [09:49<05:04,  5.70it/s][A
Iteration:  63%|██████▎   | 2956/4688 [09:49<05:02,  5.72it/s][A
Iteration:  63%|██████▎   | 2957/4688 [09:50<05:02,  5.73it/s][A
Iteration:  63%|██████▎   | 2958/4688 [09:50<05:01,  5.73it/s][A
Iteration:  63%|██████▎   | 2959/4688 [09:50<05:02,  5.71it/s][A
Iteration:  63%|██████▎   | 2960/4688 [09:50<05:02,  5.71it/s][A
Iteration:  63%|██████▎   | 2961/4688 [09:50<05:02,  5.71it/s][A
Iteration:

Iteration:  66%|██████▌   | 3071/4688 [10:10<04:41,  5.75it/s][A
Iteration:  66%|██████▌   | 3072/4688 [10:10<04:42,  5.72it/s][A
Iteration:  66%|██████▌   | 3073/4688 [10:10<04:40,  5.76it/s][A
Iteration:  66%|██████▌   | 3074/4688 [10:10<04:39,  5.77it/s][A
Iteration:  66%|██████▌   | 3075/4688 [10:10<04:38,  5.79it/s][A
Iteration:  66%|██████▌   | 3076/4688 [10:10<04:41,  5.72it/s][A
Iteration:  66%|██████▌   | 3077/4688 [10:11<04:41,  5.73it/s][A
Iteration:  66%|██████▌   | 3078/4688 [10:11<04:39,  5.75it/s][A
Iteration:  66%|██████▌   | 3079/4688 [10:11<04:40,  5.74it/s][A
Iteration:  66%|██████▌   | 3080/4688 [10:11<04:39,  5.75it/s][A
Iteration:  66%|██████▌   | 3081/4688 [10:11<04:37,  5.78it/s][A
Iteration:  66%|██████▌   | 3082/4688 [10:11<04:42,  5.68it/s][A
Iteration:  66%|██████▌   | 3083/4688 [10:12<04:40,  5.72it/s][A
Iteration:  66%|██████▌   | 3084/4688 [10:12<04:39,  5.74it/s][A
Iteration:  66%|██████▌   | 3085/4688 [10:12<04:39,  5.73it/s][A
Iteration:

Iteration:  68%|██████▊   | 3195/4688 [10:31<04:22,  5.68it/s][A
Iteration:  68%|██████▊   | 3196/4688 [10:31<04:21,  5.71it/s][A
Iteration:  68%|██████▊   | 3197/4688 [10:32<04:20,  5.73it/s][A
Iteration:  68%|██████▊   | 3198/4688 [10:32<04:20,  5.72it/s][A
Iteration:  68%|██████▊   | 3199/4688 [10:32<04:23,  5.65it/s][A
Iteration:  68%|██████▊   | 3200/4688 [10:32<04:23,  5.66it/s][A
Iteration:  68%|██████▊   | 3201/4688 [10:32<04:21,  5.68it/s][A
Iteration:  68%|██████▊   | 3202/4688 [10:32<04:19,  5.72it/s][A
Iteration:  68%|██████▊   | 3203/4688 [10:33<04:18,  5.74it/s][A
Iteration:  68%|██████▊   | 3204/4688 [10:33<04:17,  5.76it/s][A
Iteration:  68%|██████▊   | 3205/4688 [10:33<04:18,  5.74it/s][A
Iteration:  68%|██████▊   | 3206/4688 [10:33<04:20,  5.68it/s][A
Iteration:  68%|██████▊   | 3207/4688 [10:33<04:22,  5.64it/s][A
Iteration:  68%|██████▊   | 3208/4688 [10:34<04:21,  5.65it/s][A
Iteration:  68%|██████▊   | 3209/4688 [10:34<04:20,  5.67it/s][A
Iteration:

Iteration:  71%|███████   | 3319/4688 [10:53<03:57,  5.76it/s][A
Iteration:  71%|███████   | 3320/4688 [10:53<03:58,  5.73it/s][A
Iteration:  71%|███████   | 3321/4688 [10:53<03:57,  5.75it/s][A
Iteration:  71%|███████   | 3322/4688 [10:53<03:59,  5.70it/s][A
Iteration:  71%|███████   | 3323/4688 [10:54<03:59,  5.70it/s][A
Iteration:  71%|███████   | 3324/4688 [10:54<03:58,  5.72it/s][A
Iteration:  71%|███████   | 3325/4688 [10:54<03:57,  5.75it/s][A
Iteration:  71%|███████   | 3326/4688 [10:54<03:56,  5.77it/s][A
Iteration:  71%|███████   | 3327/4688 [10:54<03:56,  5.74it/s][A
Iteration:  71%|███████   | 3328/4688 [10:55<03:57,  5.72it/s][A
Iteration:  71%|███████   | 3329/4688 [10:55<03:59,  5.68it/s][A
Iteration:  71%|███████   | 3330/4688 [10:55<04:01,  5.62it/s][A
Iteration:  71%|███████   | 3331/4688 [10:55<04:00,  5.65it/s][A
Iteration:  71%|███████   | 3332/4688 [10:55<03:57,  5.71it/s][A
Iteration:  71%|███████   | 3333/4688 [10:55<03:57,  5.71it/s][A
Iteration:

Iteration:  73%|███████▎  | 3443/4688 [11:15<03:38,  5.69it/s][A
Iteration:  73%|███████▎  | 3444/4688 [11:15<03:36,  5.73it/s][A
Iteration:  73%|███████▎  | 3445/4688 [11:15<03:37,  5.72it/s][A
Iteration:  74%|███████▎  | 3446/4688 [11:15<03:37,  5.72it/s][A
Iteration:  74%|███████▎  | 3447/4688 [11:15<03:36,  5.74it/s][A
Iteration:  74%|███████▎  | 3448/4688 [11:16<03:37,  5.69it/s][A
Iteration:  74%|███████▎  | 3449/4688 [11:16<03:39,  5.66it/s][A
Iteration:  74%|███████▎  | 3450/4688 [11:16<03:39,  5.65it/s][A
Iteration:  74%|███████▎  | 3451/4688 [11:16<03:38,  5.67it/s][A
Iteration:  74%|███████▎  | 3452/4688 [11:16<03:36,  5.70it/s][A
Iteration:  74%|███████▎  | 3453/4688 [11:16<03:36,  5.70it/s][A
Iteration:  74%|███████▎  | 3454/4688 [11:17<03:35,  5.73it/s][A
Iteration:  74%|███████▎  | 3455/4688 [11:17<03:34,  5.75it/s][A
Iteration:  74%|███████▎  | 3456/4688 [11:17<03:33,  5.77it/s][A
Iteration:  74%|███████▎  | 3457/4688 [11:17<03:34,  5.75it/s][A
Iteration:

KeyboardInterrupt: 

## Inference
Input file: `sample_pred_in.txt`. Output file: `sample_pred_out.txt`.

In [6]:
from predict import predict

# Prediction uses its own, smaller option set. Note that this rebinds the
# notebook-level name `parser` that the training configuration cell also uses.
parser = argparse.ArgumentParser()

# Files to read from / write to, and the directory holding the trained model.
parser.add_argument(
    "--input_file",
    default="sample_pred_in.txt",
    type=str,
    help="Input file for prediction",
)
parser.add_argument(
    "--output_file",
    default="sample_pred_out.txt",
    type=str,
    help="Output file for prediction",
)
parser.add_argument(
    "--model_dir",
    default="./model",
    type=str,
    help="Path to save, load model",
)

# Runtime options.
parser.add_argument(
    "--batch_size",
    default=32,
    type=int,
    help="Batch size for prediction",
)
parser.add_argument(
    "--no_cuda",
    action="store_true",
    help="Avoid using CUDA when available",
)

# Parse an empty argument list so every option takes its default and the
# kernel's own sys.argv is not read.
pred_config = parser.parse_args([])

# Run prediction with the defaults above.
# NOTE(review): presumably reads input_file and writes output_file using the
# model in model_dir -- confirm against predict.py.
predict(pred_config)

The tokenizer class you load from this checkpoint is not the same type as the class this function is called from. It may result in unexpected tokenization. 
The tokenizer class you load from this checkpoint is 'BertTokenizer'. 
The class this function is called from is 'KoBertTokenizer'.
Predicting: 100%|██████████| 1/1 [00:00<00:00, 64.61it/s]
