# 基于TextCNN的头条新闻分类笔记

## 编写配置

In [61]:
import torch 
import torch.nn as nn

config = {
    'train_file_path': '../../../data/toutiao_news_cls/train.csv',
    'test_file_path': '../../../data/toutiao_news_cls/test.csv',
    'train_val_ratio': 0.1,  # 10%用作验证集
    'vocab_size': 10000,   # 词典 3W
    'batch_size': 32,      # batch 大小 64
    'num_epochs': 3,      # 10次迭代
    'learning_rate': 1e-3, # 学习率
    'logging_step': 100,   # 每跑300个batch记录一次
    'seed': 2022           # 随机种子
}

config['device'] = 'cuda' if torch.cuda.is_available() else 'cpu' # cpu&gpu

import random
import numpy as np

def seed_everything(seed):
    random.seed(seed)
    np.random.seed(seed)
    torch.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)
    return seed

seed_everything(config['seed'])

2022

## 获得词汇表

In [2]:
from collections import Counter
from tqdm import tqdm
import jieba

def get_vocab(config):
    token_counter = Counter()
    with open(config['train_file_path'], 'r', encoding='utf8') as f:
        lines = f.readlines()
        for line in tqdm(lines, desc='Counting tokens...', total=len(lines)):
            sent = line.split(',')[-1].strip()
            sent_cut = list(jieba.cut(sent))
            token_counter.update(sent_cut)
            
    vocab = set(token for token, _ in token_counter.most_common(config['vocab_size']))
    return vocab

In [3]:
vocab = get_vocab(config)
vocab

Counting tokens...:   0%|                                         | 0/53361 [00:00<?, ?it/s]Building prefix dict from the default dictionary ...
Loading model from cache /var/folders/19/dgxwsbgd76728hx577833nx00000gn/T/jieba.cache
Loading model cost 0.598 seconds.
Prefix dict has been built successfully.
Counting tokens...: 100%|███████████████████████████| 53361/53361 [00:06<00:00, 8123.94it/s]


{'处理器',
 '必去',
 '石',
 '屏幕',
 '知多少',
 '传说',
 '具有',
 '情',
 '这才',
 '理财产品',
 '10',
 '廖英强',
 '怪',
 '概念股',
 '混动',
 '起飞',
 '余',
 '自信',
 '入围',
 '园',
 '以前',
 '尸体',
 '无',
 '醒来',
 '颤抖',
 '组团',
 '一字',
 '：',
 '古今',
 '难民',
 '隐居',
 '县城',
 '同框',
 '路上',
 '丢',
 '境外',
 '可不是',
 '灭绝',
 '出售',
 '被动',
 '霸道',
 '直到',
 '认识',
 '些',
 '路虎',
 '面包车',
 '检验',
 '协会',
 '俗语',
 '大杀器',
 '上调',
 '看清',
 '超过',
 '行为',
 '里程',
 '国际乒联',
 '聊天',
 '风采',
 '抢滩',
 '遍地',
 'B2B',
 '慌',
 '含泪',
 '求助',
 '扮演',
 '没人敢',
 '源自',
 '爷爷',
 '不算',
 '效率',
 '报道',
 '截图',
 '缺',
 '难度',
 '嘉年华',
 '耗电',
 '坚果',
 '科学家',
 '中国空军',
 '车子',
 '我要',
 '偶遇',
 'O',
 '烟花',
 '大姐',
 '蓝海',
 '合同',
 '南非',
 '安置',
 '行者',
 '理财',
 '张檬',
 '入驻',
 '年前',
 '头号',
 '烧',
 '充电',
 '回来',
 '一部',
 '多岁',
 '实现',
 '这么久',
 '猜',
 '接送',
 '民国',
 '光棍',
 '东西部',
 '大胆',
 '尔特',
 '月球',
 '终生',
 '青',
 '新人',
 '配合',
 '亿万富豪',
 '领跑',
 '接受',
 '思维',
 '激光',
 '戴安娜',
 '服务器',
 '何炅',
 '赌',
 '综述',
 '条件',
 '狂欢',
 '导致',
 '今年',
 '尊严',
 '献给',
 '右',
 '七大',
 '图集',
 'bug',
 '云南',
 '屡屡',
 '各方',
 '之战',
 '宾利',
 '连云港',
 '亏损',
 '2',

## 获得词向量

In [4]:
import bz2

with bz2.open('../../../pt/sgns_weibo/sgns.weibo.word.bz2') as f:
    token_vector = f.readlines()    

In [5]:
for i, line in enumerate(token_vector):
    line_split = line.split()
    if i == 0:
        print(f'词汇规模:{(int)(line_split[0])}, 特征维度:{(int)(line_split[1])}')
    else:
        print(f"词汇:{line_split[0].decode('utf8')}\n特征:{line_split[1:]}")
    print()
    
    if i > 2:
        break

词汇规模:195202, 特征维度:300

词汇:，
特征:[b'0.094386', b'-0.200944', b'-0.030828', b'0.277130', b'-0.074674', b'0.239691', b'0.345185', b'0.298053', b'-0.026679', b'-0.077352', b'0.245854', b'-0.075995', b'0.058849', b'-0.176755', b'-0.072721', b'-0.246469', b'-0.182233', b'0.267472', b'0.109897', b'-0.266215', b'0.176660', b'-0.101581', b'0.374443', b'0.304319', b'0.024169', b'-0.158494', b'-0.254765', b'-0.265324', b'0.225498', b'-0.126215', b'-0.207172', b'-0.334429', b'-0.003584', b'-0.065530', b'0.174206', b'-0.097252', b'0.114595', b'-0.158193', b'-0.099948', b'-0.145332', b'-0.076565', b'-0.119460', b'0.074718', b'-0.056694', b'0.394867', b'-0.127122', b'0.270542', b'0.087482', b'-0.114715', b'0.124381', b'-0.149974', b'0.192933', b'0.131023', b'0.099271', b'-0.062209', b'0.079382', b'0.000578', b'-0.166215', b'0.155815', b'-0.279675', b'-0.184237', b'0.123209', b'0.043216', b'-0.308681', b'0.036135', b'0.064121', b'0.037674', b'0.026703', b'0.307341', b'0.089780', b'-0.057681', b'-0.2523

In [6]:
def get_embedding(vocab):
    token2embedding ={}

    with bz2.open('../../../pt/sgns_weibo/sgns.weibo.word.bz2') as f:
        token_vector = f.readlines()

        meta_info = token_vector[0].split()
        print(f'{(int)(meta_info[0])} tokens in embedding file in total, vector size is {(int)(meta_info[1])}')

        for line in tqdm(token_vector[1:]):
            line = line.split()
            token = line[0].decode('utf8')

            vector = line[1:]

            if token in vocab:
                token2embedding[token] = [float(num) for num in vector]

        # enumerate(, [start])
        token2id = {token: idx for idx, token in enumerate(token2embedding.keys(), 4)}
        id2embedding = {token2id[token]: embedding for token, embedding in token2embedding.items()}

        PAD, UNK, BOS, EOS = '<pad>', '<unk>', '<bos>', '<eos>'

        token2id[PAD] = 0
        token2id[UNK] = 1
        token2id[BOS] = 2
        token2id[EOS] = 3

        id2embedding[0] = [.0] * int(meta_info[1])
        id2embedding[1] = [.0] * int(meta_info[1])

        id2embedding[2] = np.random.random(int(meta_info[1])).tolist()
        id2embedding[3] = np.random.random(int(meta_info[1])).tolist()

        emb_mat = [id2embedding[idx] for idx in range(len(id2embedding))]

        return torch.tensor(emb_mat, dtype=torch.float), token2id, len(vocab)+4


In [7]:
emb_mat, token2id, config['vocab_size'] = get_embedding(vocab)

195202 tokens in embedding file in total, vector size is 300


100%|████████████████████████████████████████████| 195202/195202 [00:03<00:00, 63168.67it/s]


## 数据预处理并编写DataLoader

In [29]:
def tokenizer(sent, token2id):
    ids = [token2id.get(token, 1) for token in jieba.cut(sent)]
    return ids

In [9]:
import pandas as pd
from collections import defaultdict

In [30]:
def read_data(config, token2id, mode='train'):
    
    data_df = pd.read_csv(config[f'{mode}_file_path'], sep=',')
    LABEL, SENTENCE = 'label', 'sentence'
    data_df[SENTENCE].apply(lambda s: ' '.join([str(id_) for id_ in tokenizer(s, token2id)]))
    data_df['input_ids'] = data_df[SENTENCE].apply(lambda s: ' '.join([str(id_) for id_ in tokenizer(s, token2id)]))
    sentence_wids = np.array([[int(id_) for id_ in v.split()] for v in data_df['input_ids'].values])

    if mode == 'train':
        labels = data_df[LABEL].values
        
        X_train, y_train = defaultdict(list), []
        X_val, y_val = defaultdict(list), []
        num_val = int(config['train_val_ratio'] * len(data_df))
        
        # shuffle ids
        ids = np.random.choice(range(len(data_df)), size=len(data_df), replace=False)
        train_ids = ids[num_val:]
        val_ids = ids[:num_val]
        
        # get input_ids
        X_train['input_ids'], y_train = sentence_wids[train_ids], labels[train_ids]
        X_val['input_ids'], y_val = sentence_wids[val_ids], labels[val_ids]
        
        # label 
        label2id = {label: i for i, label in enumerate(np.unique(y_train))}
        id2label = {i: label for label, i in label2id.items()}
        y_train = torch.tensor([label2id[y] for y in y_train], dtype=torch.long)
        y_val = torch.tensor([label2id[y] for y in y_val], dtype=torch.long)

        return X_train, y_train, X_val, y_val, label2id, id2label

    else:
        X_test = defaultdict(list)
        X_test['input_ids'] = sentence_wids
        y_test = torch.zeros(len(data_df), dtype=torch.long)
        
        return X_test, y_test

In [31]:
X_train, y_train, X_val, y_val, label2id, id2label = read_data(config, token2id, mode='train')

  import sys


In [32]:
X_test, y_test = read_data(config, token2id, mode='test')

  import sys


#### Dataset提供数据集的封装，创建/继承Dataset必须实现:
+ __len__: 整个数据集的长度
+ __getitem__: 支持数据集索引的函数

In [44]:
from torch.utils.data import Dataset

class TNEWSDataset(Dataset):
    def __init__(self, X, y):
        self.x = X
        self.y = y
        
    def __getitem__(self, idx):
        return {
            'input_ids': self.x['input_ids'][idx],
            'label': self.y[idx]
        }
    
    def __len__(self):
        return self.y.size(0)

#### 使用DataLoader实现数据集的并行加载
+ DataLoader提供一个可迭代对象，实现数据并行加载，从TNEWSDataset返回一个example，取多次，最后形成一个长度为batch_size的列表examples
+ examples的格式：[dict1, dict2, ...]
+ collate_fn()将examples中的数据合并为Tensor

In [41]:
def collate_fn(examples):
    input_ids_lst = []
    labels = []
    for example in examples:
        input_ids_lst.append(example['input_ids'])
        labels.append(example['label'])
        
    # input_ids_lst中最长的句子长度
    max_length = max(len(input_ids) for input_ids in input_ids_lst)
    # 定义一个Tensor
    input_ids_tensor = torch.zeros((len(labels), max_length), dtype=torch.long)
    
    for i, input_ids in enumerate(input_ids_lst):
        seq_len = len(input_ids)
        input_ids_tensor[i, :seq_len] = torch.tensor(input_ids, dtype=torch.long)
    
    return {
        'input_ids': input_ids_tensor,
        'label': torch.tensor(labels, dtype=torch.long)
    }

In [42]:
from torch.utils.data import DataLoader

def build_dataloader(config, vocab):
    X_train, y_train, X_val, y_val, label2id, id2label = read_data(config, token2id, mode='train')
    X_test, y_test = read_data(config, token2id, mode='test')
    
    train_dataset = TNEWSDataset(X_train, y_train)
    val_dataset = TNEWSDataset(X_val, y_val)
    test_dataset = TNEWSDataset(X_test, y_test)
    
    train_dataloader = DataLoader(dataset=train_dataset, batch_size=config['batch_size'], num_workers=0, shuffle=True, collate_fn=collate_fn)
    val_dataloader = DataLoader(dataset=val_dataset, batch_size=config['batch_size'], num_workers=0, shuffle=False, collate_fn=collate_fn)
    test_dataloader = DataLoader(dataset=test_dataset, batch_size=config['batch_size'], num_workers=0, shuffle=False, collate_fn=collate_fn)

    return id2label, train_dataloader, val_dataloader, test_dataloader

In [45]:
id2label, train_dataloader, val_dataloader, test_dataloader = build_dataloader(config, vocab)

  import sys


In [47]:
for batch in train_dataloader:
    print(len(batch['input_ids']))
    print(batch)
    break

32
{'input_ids': tensor([[  48,    1,  581,    5,    1, 5811,    4,  227,   98,    1,   92,    4,
            1,  566,    8, 4341,    0,    0,    0,    0,    0,    0,    0,    0,
            0,    0],
        [  60,    1,   63,  340, 3077,   17, 6634,   80,  947, 1934,    1,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
            0,    0],
        [   1, 6733,    1,  380,    1,    1,    0,    0,    0,    0,    0,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
            0,    0],
        [   1,  360,   18,    1, 4724,  721,   22,    0,    0,    0,    0,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,
            0,    0],
        [ 340,    1, 1423,    5, 2574, 1862,   18, 1915,   30,  471,  379,  575,
            5,   24,   22,   17,    0,    0,    0,    0,    0,    0,    0,    0,
            0,    0],
        [8570, 1006,  278,    1, 2208,    4,  221, 8716,   68, 

## 实现TextCNN并训练验证

In [48]:
model_config = {
    'embedding_pretrained' : emb_mat,
    'num_filters' : 256,
    'emb_size' : emb_mat.shape[1],
    'dropout' : 0.3,
    'filter_sizes' : [2,3,5],
    'num_classes' : len(label2id)
}

In [49]:
emb_mat.dtype

torch.float32

In [50]:
import torch.nn.functional as F

class Model(nn.Module):
    def __init__(self, config):
        super(Model, self).__init__()
        
        self.embedding = nn.Embedding.from_pretrained(config['embedding_pretrained'], freeze=True)
        self.convs = nn.ModuleList([nn.Conv2d(1, config['num_filters'], (k, config['emb_size'])) for k in config['filter_sizes']])
        self.dropout = nn.Dropout(config['dropout'])
        
        self.fc = nn.Linear(len(config['filter_sizes']) * config['num_filters'], config['num_classes'])

        
    def convs_and_pool(self, x, conv):
        # x [batch_size, out_channels, seq_len_out, 1]
        # x [batch_size, out_channels, seq_len_out]
        x = F.relu(conv(x)).squeeze(3)
        
        # x [batch_size, out_channels, 1]
        # x [batch_size, out_channels]
        x = F.max_pool1d(x, x.size(2)).squeeze(2)
        
        return x
    
    def forward(self, input_ids=None, label=None):
        # out [batch_size, seq_len, embedding_dim]
        out = self.embedding(input_ids)
        
        # out [batch_size, 1, seq_len, embedding_dim]
        out = out.unsqueeze(1)
        
        # (batch_size, out_channels)
        out = torch.cat([self.convs_and_pool(out, conv) for conv in self.convs], 1)
        
        out = self.dropout(out)
        out = self.fc(out)
        output = (out, )
        
        if label is not None:  # for train
            loss_fct = nn.CrossEntropyLoss()
            loss = loss_fct(out, label)
            output = (loss,) + output
            
        return output

In [51]:
model = Model(model_config)

In [52]:
from sklearn.metrics import f1_score

def evaluation(config, model, val_dataloader):
    model.eval()
    preds = []
    labels = []
    val_loss = 0.
    val_iterator = tqdm(val_dataloader, desc='Evaluation...', total=len(val_dataloader))
    with torch.no_grad():
        for batch in val_iterator:
            labels.append(batch['label'])
            batch = {item:value.to(config['device']) for item, value in batch.items()}
            
            # val output (loss, out)
            loss, logits = model(**batch)[:2]
            val_loss += loss.item()
            
            preds.append(logits.argmax(dim=-1).detach().cpu())
            
    avg_val_loss = val_loss/len(val_dataloader)
    labels = torch.cat(labels, dim=0).numpy()
    preds = torch.cat(preds, dim=0).numpy()
    
    f1 =f1_score(labels, preds, average='macro')
    
    return avg_val_loss, f1

In [62]:
from torch.optim import AdamW
from tqdm import trange

def train(model, config, id2label, train_dataloader, val_dataloader):
    optimizer = AdamW(model.parameters(), lr=config['learning_rate'])
    model.to(config['device'])
    epoches_iterator = trange(config['num_epochs'])
    
    # 200batch/epoch * 10epochs = global_step
    global_step = 0
    train_loss = 0.
    # logging_loss = 0.
    
    for epoch in epoches_iterator:
        train_iterator = tqdm(train_dataloader, desc='Training', total=len(train_dataloader))
        model.train()
        for batch in train_iterator:
            batch = {item:value.to(config['device']) for item, value in batch.items()}
            
            # train output (loss, out)
            loss = model(**batch)[0]
            
            model.zero_grad()
            loss.backward()
            optimizer.step()
            train_loss += loss
            global_step += 1
            
            if global_step % config['logging_step'] == 0:
                print_train_loss = train_loss / config['logging_step']
                train_loss = 0.
                avg_val_loss, f1 = evaluation(config, model, val_dataloader)
                print_log = f'>>> training loss: {print_train_loss: .4f}, valid loss: {avg_val_loss: .4f}, valid f1 score: {f1: .4f}'
                print(print_log)
                model.train()
                
    return model

In [63]:
best_model = train(model, config, id2label, train_dataloader, val_dataloader)

  0%|                                                                 | 0/8 [00:00<?, ?it/s]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:55, 12.99it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:44, 14.26it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:37, 15.32it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:34, 15.88it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:34, 15.76it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:30, 16.43it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:33, 15.84it/s][A
Training:   1%|▍                                          | 16/1501 [00:01<01:30, 16.35it/s][A
Training:   1%|▌                           

Evaluation...:  79%|██████████████████████████████        | 132/167 [00:04<00:01, 29.76it/s][A[A

Evaluation...:  81%|██████████████████████████████▉       | 136/167 [00:04<00:00, 31.71it/s][A[A

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:04<00:00, 32.38it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 33.05it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 33.54it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 33.92it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 30.55it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 31.70it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 32.45it/s][A[A

Training:   7%|██▊                                       | 101/1501 [00:11<19:23,  1.20it/s][A
Trai

>>> training loss:  0.7606, valid loss:  1.5865, valid f1 score:  0.4923



Training:   7%|██▉                                       | 105/1501 [00:12<10:11,  2.28it/s][A
Training:   7%|██▉                                       | 107/1501 [00:12<07:32,  3.08it/s][A
Training:   7%|███                                       | 109/1501 [00:12<05:40,  4.09it/s][A
Training:   7%|███                                       | 111/1501 [00:12<04:23,  5.28it/s][A
Training:   8%|███▏                                      | 113/1501 [00:12<03:30,  6.60it/s][A
Training:   8%|███▏                                      | 115/1501 [00:12<02:49,  8.15it/s][A
Training:   8%|███▎                                      | 117/1501 [00:12<02:22,  9.72it/s][A
Training:   8%|███▎                                      | 119/1501 [00:12<02:01, 11.34it/s][A
Training:   8%|███▍                                      | 121/1501 [00:12<01:46, 12.98it/s][A
Training:   8%|███▍                                      | 123/1501 [00:13<01:38, 13.92it/s][A
Training:   8%|███▍                    

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.20it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 37.12it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.14it/s][A[A

Training:  13%|█████▌                                    | 200/1501 [00:21<15:22,  1.41it/s][A
Training:  13%|█████▋                                    | 202/1501 [00:22<11:08,  1.94it/s][A

>>> training loss:  0.7615, valid loss:  1.5887, valid f1 score:  0.4896



Training:  14%|█████▋                                    | 204/1501 [00:22<08:11,  2.64it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:22<06:07,  3.52it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:22<04:37,  4.65it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:22<03:35,  5.99it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:22<02:54,  7.41it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:22<02:22,  9.04it/s][A
Training:  14%|██████                                    | 216/1501 [00:22<02:00, 10.69it/s][A
Training:  15%|██████                                    | 218/1501 [00:22<01:44, 12.24it/s][A
Training:  15%|██████▏                                   | 220/1501 [00:23<01:35, 13.43it/s][A
Training:  15%|██████▏                                   | 222/1501 [00:23<01:27, 14.60it/s][A
Training:  15%|██████▎                 

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 37.19it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 37.73it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 36.88it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.49it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.97it/s][A[A

Training:  20%|████████▍                                 | 301/1501 [00:32<14:27,  1.38it/s][A
Training:  20%|████████▍                                 | 303/1501 [00:32<10:31,  1.90it/s][A

>>> training loss:  0.7321, valid loss:  1.6004, valid f1 score:  0.4942



Training:  20%|████████▌                                 | 305/1501 [00:32<07:44,  2.57it/s][A
Training:  20%|████████▌                                 | 307/1501 [00:32<05:46,  3.44it/s][A
Training:  21%|████████▋                                 | 309/1501 [00:32<04:23,  4.52it/s][A
Training:  21%|████████▋                                 | 311/1501 [00:32<03:29,  5.67it/s][A
Training:  21%|████████▊                                 | 313/1501 [00:32<02:48,  7.05it/s][A
Training:  21%|████████▊                                 | 315/1501 [00:32<02:19,  8.49it/s][A
Training:  21%|████████▊                                 | 317/1501 [00:33<01:57, 10.05it/s][A
Training:  21%|████████▉                                 | 319/1501 [00:33<01:40, 11.71it/s][A
Training:  21%|████████▉                                 | 321/1501 [00:33<01:30, 13.03it/s][A
Training:  22%|█████████                                 | 323/1501 [00:33<01:22, 14.21it/s][A
Training:  22%|█████████               

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.07it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 39.46it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.85it/s][A[A

Training:  27%|███████████▏                              | 401/1501 [00:42<12:52,  1.42it/s][A
Training:  27%|███████████▎                              | 403/1501 [00:42<09:18,  1.97it/s][A

>>> training loss:  0.7662, valid loss:  1.6034, valid f1 score:  0.4892



Training:  27%|███████████▎                              | 405/1501 [00:42<06:50,  2.67it/s][A
Training:  27%|███████████▍                              | 407/1501 [00:42<05:04,  3.59it/s][A
Training:  27%|███████████▍                              | 409/1501 [00:42<03:52,  4.70it/s][A
Training:  27%|███████████▌                              | 411/1501 [00:42<02:59,  6.09it/s][A
Training:  28%|███████████▌                              | 413/1501 [00:42<02:23,  7.60it/s][A
Training:  28%|███████████▌                              | 415/1501 [00:42<01:56,  9.29it/s][A
Training:  28%|███████████▋                              | 417/1501 [00:43<01:40, 10.82it/s][A
Training:  28%|███████████▋                              | 419/1501 [00:43<01:27, 12.39it/s][A
Training:  28%|███████████▊                              | 421/1501 [00:43<01:18, 13.67it/s][A
Training:  28%|███████████▊                              | 423/1501 [00:43<01:14, 14.53it/s][A
Training:  28%|███████████▉            

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.88it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 40.13it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 39.59it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 39.07it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.26it/s][A[A

Training:  33%|██████████████                            | 501/1501 [00:52<12:12,  1.37it/s][A

>>> training loss:  0.8013, valid loss:  1.6458, valid f1 score:  0.4805



Training:  34%|██████████████                            | 503/1501 [00:52<08:52,  1.87it/s][A
Training:  34%|██████████████▏                           | 505/1501 [00:52<06:32,  2.54it/s][A
Training:  34%|██████████████▏                           | 507/1501 [00:52<04:52,  3.40it/s][A
Training:  34%|██████████████▏                           | 509/1501 [00:52<03:40,  4.51it/s][A
Training:  34%|██████████████▎                           | 511/1501 [00:53<02:51,  5.78it/s][A
Training:  34%|██████████████▎                           | 513/1501 [00:53<02:16,  7.26it/s][A
Training:  34%|██████████████▍                           | 515/1501 [00:53<01:51,  8.85it/s][A
Training:  34%|██████████████▍                           | 517/1501 [00:53<01:33, 10.54it/s][A
Training:  35%|██████████████▌                           | 519/1501 [00:53<01:23, 11.81it/s][A
Training:  35%|██████████████▌                           | 521/1501 [00:53<01:17, 12.63it/s][A
Training:  35%|██████████████▋         

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 37.45it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 37.96it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 38.93it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.40it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.38it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.27it/s][A[A

Training:  40%|████████████████▊                         | 600/1501 [01:02<11:14,  1.33it/s][A
Training:  40%|████████████████▊                         | 602/1501 [01:02<08:06,  1.85it/s][A

>>> training loss:  0.7953, valid loss:  1.5890, valid f1 score:  0.5057



Training:  40%|████████████████▉                         | 604/1501 [01:03<05:55,  2.52it/s][A
Training:  40%|████████████████▉                         | 606/1501 [01:03<04:23,  3.39it/s][A
Training:  41%|█████████████████                         | 608/1501 [01:03<03:17,  4.51it/s][A
Training:  41%|█████████████████                         | 610/1501 [01:03<02:34,  5.76it/s][A
Training:  41%|█████████████████                         | 612/1501 [01:03<02:03,  7.18it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [01:03<01:43,  8.60it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [01:03<01:26, 10.22it/s][A
Training:  41%|█████████████████▎                        | 618/1501 [01:03<01:13, 11.93it/s][A
Training:  41%|█████████████████▎                        | 620/1501 [01:03<01:05, 13.37it/s][A
Training:  41%|█████████████████▍                        | 622/1501 [01:04<01:01, 14.31it/s][A
Training:  42%|█████████████████▍      

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 37.92it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 38.61it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.72it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 37.88it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.05it/s][A[A

Training:  47%|███████████████████▌                      | 700/1501 [01:13<10:03,  1.33it/s][A
Training:  47%|███████████████████▋                      | 702/1501 [01:13<07:16,  1.83it/s][A

>>> training loss:  0.8127, valid loss:  1.5936, valid f1 score:  0.5005



Training:  47%|███████████████████▋                      | 704/1501 [01:13<05:19,  2.49it/s][A
Training:  47%|███████████████████▊                      | 706/1501 [01:13<03:57,  3.34it/s][A
Training:  47%|███████████████████▊                      | 708/1501 [01:13<03:00,  4.39it/s][A
Training:  47%|███████████████████▊                      | 710/1501 [01:13<02:18,  5.70it/s][A
Training:  47%|███████████████████▉                      | 712/1501 [01:14<01:51,  7.09it/s][A
Training:  48%|███████████████████▉                      | 714/1501 [01:14<01:30,  8.66it/s][A
Training:  48%|████████████████████                      | 716/1501 [01:14<01:16, 10.23it/s][A
Training:  48%|████████████████████                      | 718/1501 [01:14<01:07, 11.56it/s][A
Training:  48%|████████████████████▏                     | 720/1501 [01:14<01:00, 12.91it/s][A
Training:  48%|████████████████████▏                     | 722/1501 [01:14<00:54, 14.23it/s][A
Training:  48%|████████████████████▎   

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 38.06it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 39.77it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 38.82it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 38.00it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 35.48it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.84it/s][A[A

Training:  53%|██████████████████████▍                   | 800/1501 [01:23<08:38,  1.35it/s][A
Training:  53%|██████████████████████▍                   | 802/1501 [01:24<06:17,  1.85it/s][A

>>> training loss:  0.8287, valid loss:  1.6077, valid f1 score:  0.4976



Training:  54%|██████████████████████▍                   | 804/1501 [01:24<04:36,  2.52it/s][A
Training:  54%|██████████████████████▌                   | 806/1501 [01:24<03:27,  3.35it/s][A
Training:  54%|██████████████████████▌                   | 808/1501 [01:24<02:36,  4.44it/s][A
Training:  54%|██████████████████████▋                   | 810/1501 [01:24<02:01,  5.70it/s][A
Training:  54%|██████████████████████▋                   | 812/1501 [01:24<01:36,  7.13it/s][A
Training:  54%|██████████████████████▊                   | 814/1501 [01:24<01:18,  8.71it/s][A
Training:  54%|██████████████████████▊                   | 816/1501 [01:24<01:08, 10.06it/s][A
Training:  54%|██████████████████████▉                   | 818/1501 [01:25<00:59, 11.54it/s][A
Training:  55%|██████████████████████▉                   | 820/1501 [01:25<00:54, 12.61it/s][A
Training:  55%|███████████████████████                   | 822/1501 [01:25<00:48, 13.90it/s][A
Training:  55%|███████████████████████ 

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 38.27it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.30it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.29it/s][A[A

Training:  60%|█████████████████████████▏                | 901/1501 [01:34<07:07,  1.40it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:34<05:09,  1.93it/s][A

>>> training loss:  0.8363, valid loss:  1.6123, valid f1 score:  0.5022



Training:  60%|█████████████████████████▎                | 905/1501 [01:34<03:45,  2.64it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:34<02:46,  3.56it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:34<02:07,  4.63it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:34<01:40,  5.86it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:35<01:21,  7.21it/s][A
Training:  61%|█████████████████████████▌                | 915/1501 [01:35<01:08,  8.61it/s][A
Training:  61%|█████████████████████████▋                | 917/1501 [01:35<00:57, 10.08it/s][A
Training:  61%|█████████████████████████▋                | 919/1501 [01:35<00:51, 11.33it/s][A
Training:  61%|█████████████████████████▊                | 921/1501 [01:35<00:45, 12.76it/s][A
Training:  61%|█████████████████████████▊                | 923/1501 [01:35<00:41, 13.80it/s][A
Training:  62%|████████████████████████

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.46it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.32it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.13it/s][A[A

Training:  67%|███████████████████████████▎             | 1000/1501 [01:44<06:04,  1.37it/s][A
Training:  67%|███████████████████████████▎             | 1002/1501 [01:44<04:22,  1.90it/s][A

>>> training loss:  0.8377, valid loss:  1.6125, valid f1 score:  0.4936



Training:  67%|███████████████████████████▍             | 1004/1501 [01:44<03:13,  2.57it/s][A
Training:  67%|███████████████████████████▍             | 1006/1501 [01:44<02:23,  3.45it/s][A
Training:  67%|███████████████████████████▌             | 1008/1501 [01:45<01:49,  4.52it/s][A
Training:  67%|███████████████████████████▌             | 1010/1501 [01:45<01:23,  5.85it/s][A
Training:  67%|███████████████████████████▋             | 1012/1501 [01:45<01:06,  7.37it/s][A
Training:  68%|███████████████████████████▋             | 1014/1501 [01:45<00:54,  8.91it/s][A
Training:  68%|███████████████████████████▊             | 1016/1501 [01:45<00:46, 10.54it/s][A
Training:  68%|███████████████████████████▊             | 1018/1501 [01:45<00:39, 12.10it/s][A
Training:  68%|███████████████████████████▊             | 1020/1501 [01:45<00:36, 13.18it/s][A
Training:  68%|███████████████████████████▉             | 1022/1501 [01:45<00:33, 14.25it/s][A
Training:  68%|████████████████████████

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 37.67it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 37.53it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 38.19it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 37.93it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.86it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.12it/s][A[A

Training:  73%|██████████████████████████████           | 1100/1501 [01:55<05:02,  1.32it/s][A
Training:  73%|██████████████████████████████           | 1102/1501 [01:55<03:38,  1.83it/s][A

>>> training loss:  0.8329, valid loss:  1.6232, valid f1 score:  0.4924



Training:  74%|██████████████████████████████▏          | 1104/1501 [01:55<02:38,  2.50it/s][A
Training:  74%|██████████████████████████████▏          | 1106/1501 [01:55<01:57,  3.35it/s][A
Training:  74%|██████████████████████████████▎          | 1108/1501 [01:55<01:28,  4.45it/s][A
Training:  74%|██████████████████████████████▎          | 1110/1501 [01:55<01:09,  5.65it/s][A
Training:  74%|██████████████████████████████▎          | 1112/1501 [01:55<00:54,  7.11it/s][A
Training:  74%|██████████████████████████████▍          | 1114/1501 [01:55<00:44,  8.66it/s][A
Training:  74%|██████████████████████████████▍          | 1116/1501 [01:56<00:38, 10.10it/s][A
Training:  74%|██████████████████████████████▌          | 1118/1501 [01:56<00:32, 11.63it/s][A
Training:  75%|██████████████████████████████▌          | 1120/1501 [01:56<00:29, 13.13it/s][A
Training:  75%|██████████████████████████████▋          | 1122/1501 [01:56<00:27, 14.03it/s][A
Training:  75%|████████████████████████

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:04<00:00, 38.21it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 38.28it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 38.59it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 37.28it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.21it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.41it/s][A[A

Training:  80%|████████████████████████████████▊        | 1200/1501 [02:05<03:50,  1.31it/s][A
Training:  80%|████████████████████████████████▊        | 1202/1501 [02:05<02:45,  1.81it/s][A

>>> training loss:  0.8827, valid loss:  1.6020, valid f1 score:  0.5042



Training:  80%|████████████████████████████████▉        | 1204/1501 [02:06<01:59,  2.49it/s][A
Training:  80%|████████████████████████████████▉        | 1206/1501 [02:06<01:28,  3.34it/s][A
Training:  80%|████████████████████████████████▉        | 1208/1501 [02:06<01:05,  4.46it/s][A
Training:  81%|█████████████████████████████████        | 1210/1501 [02:06<00:50,  5.78it/s][A
Training:  81%|█████████████████████████████████        | 1212/1501 [02:06<00:39,  7.30it/s][A
Training:  81%|█████████████████████████████████▏       | 1214/1501 [02:06<00:33,  8.66it/s][A
Training:  81%|█████████████████████████████████▏       | 1216/1501 [02:06<00:27, 10.30it/s][A
Training:  81%|█████████████████████████████████▎       | 1218/1501 [02:06<00:23, 11.90it/s][A
Training:  81%|█████████████████████████████████▎       | 1220/1501 [02:06<00:21, 13.36it/s][A
Training:  81%|█████████████████████████████████▍       | 1222/1501 [02:06<00:18, 14.73it/s][A
Training:  82%|████████████████████████

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 39.76it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 38.97it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.73it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.47it/s][A[A

Training:  87%|███████████████████████████████████▌     | 1300/1501 [02:15<02:22,  1.41it/s][A
Training:  87%|███████████████████████████████████▌     | 1302/1501 [02:15<01:41,  1.96it/s][A

>>> training loss:  0.8945, valid loss:  1.5972, valid f1 score:  0.4948



Training:  87%|███████████████████████████████████▌     | 1304/1501 [02:15<01:14,  2.66it/s][A
Training:  87%|███████████████████████████████████▋     | 1306/1501 [02:16<00:54,  3.56it/s][A
Training:  87%|███████████████████████████████████▋     | 1308/1501 [02:16<00:41,  4.70it/s][A
Training:  87%|███████████████████████████████████▊     | 1310/1501 [02:16<00:31,  6.03it/s][A
Training:  87%|███████████████████████████████████▊     | 1312/1501 [02:16<00:25,  7.51it/s][A
Training:  88%|███████████████████████████████████▉     | 1314/1501 [02:16<00:20,  8.98it/s][A
Training:  88%|███████████████████████████████████▉     | 1316/1501 [02:16<00:17, 10.61it/s][A
Training:  88%|████████████████████████████████████     | 1318/1501 [02:16<00:15, 12.19it/s][A
Training:  88%|████████████████████████████████████     | 1320/1501 [02:16<00:13, 13.77it/s][A
Training:  88%|████████████████████████████████████     | 1322/1501 [02:16<00:12, 14.30it/s][A
Training:  88%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 37.10it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 37.91it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 36.92it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.11it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.51it/s][A[A

Training:  93%|██████████████████████████████████████▏  | 1400/1501 [02:25<01:13,  1.38it/s][A
Training:  93%|██████████████████████████████████████▎  | 1402/1501 [02:26<00:52,  1.90it/s][A

>>> training loss:  0.8861, valid loss:  1.6034, valid f1 score:  0.4960



Training:  94%|██████████████████████████████████████▎  | 1404/1501 [02:26<00:37,  2.58it/s][A
Training:  94%|██████████████████████████████████████▍  | 1406/1501 [02:26<00:27,  3.48it/s][A
Training:  94%|██████████████████████████████████████▍  | 1408/1501 [02:26<00:20,  4.62it/s][A
Training:  94%|██████████████████████████████████████▌  | 1410/1501 [02:26<00:15,  5.98it/s][A
Training:  94%|██████████████████████████████████████▌  | 1412/1501 [02:26<00:11,  7.45it/s][A
Training:  94%|██████████████████████████████████████▌  | 1414/1501 [02:26<00:09,  9.00it/s][A
Training:  94%|██████████████████████████████████████▋  | 1416/1501 [02:26<00:08, 10.61it/s][A
Training:  94%|██████████████████████████████████████▋  | 1418/1501 [02:26<00:06, 12.13it/s][A
Training:  95%|██████████████████████████████████████▊  | 1420/1501 [02:27<00:06, 13.31it/s][A
Training:  95%|██████████████████████████████████████▊  | 1422/1501 [02:27<00:05, 14.60it/s][A
Training:  95%|████████████████████████

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 35.71it/s][A[A

Evaluation...:  89%|█████████████████████████████████▉    | 149/167 [00:04<00:00, 35.71it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 34.74it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 36.03it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 36.13it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.91it/s][A[A

Training: 100%|█████████████████████████████████████████| 1501/1501 [02:36<00:00,  9.59it/s][A
 12%|███████                                                 | 1/8 [02:36<18:16, 156.58s/it]

>>> training loss:  0.8948, valid loss:  1.6345, valid f1 score:  0.4934



Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:33, 16.11it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:28, 16.91it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:30, 16.53it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:32, 16.13it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:34, 15.81it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:33, 15.95it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:32, 16.09it/s][A
Training:   1%|▍                                          | 16/1501 [00:00<01:30, 16.41it/s][A
Training:   1%|▌                                          | 18/1501 [00:01<01:38, 15.05it/s][A
Training:   1%|▌                       

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:03<00:00, 36.07it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 35.08it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 34.45it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 35.01it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 34.27it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 34.14it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.97it/s][A[A

Training:   7%|██▊                                        | 99/1501 [00:10<18:10,  1.29it/s][A
Training:   7%|██▊                                       | 101/1501 [00:10<13:10,  1.77it/s][A

>>> training loss:  0.5992, valid loss:  1.6341, valid f1 score:  0.4967



Training:   7%|██▉                                       | 103/1501 [00:11<09:42,  2.40it/s][A
Training:   7%|██▉                                       | 105/1501 [00:11<07:10,  3.24it/s][A
Training:   7%|██▉                                       | 107/1501 [00:11<05:27,  4.25it/s][A
Training:   7%|███                                       | 109/1501 [00:11<04:14,  5.47it/s][A
Training:   7%|███                                       | 111/1501 [00:11<03:21,  6.90it/s][A
Training:   8%|███▏                                      | 113/1501 [00:11<02:43,  8.48it/s][A
Training:   8%|███▏                                      | 115/1501 [00:11<02:16, 10.13it/s][A
Training:   8%|███▎                                      | 117/1501 [00:11<02:01, 11.36it/s][A
Training:   8%|███▎                                      | 119/1501 [00:11<01:51, 12.43it/s][A
Training:   8%|███▍                                      | 121/1501 [00:12<01:43, 13.29it/s][A
Training:   8%|███▍                    

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 35.24it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 35.10it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 36.67it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 35.54it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 36.68it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.40it/s][A[A

Training:  13%|█████▌                                    | 199/1501 [00:21<16:44,  1.30it/s][A
Training:  13%|█████▌                                    | 201/1501 [00:21<12:08,  1.78it/s][A

>>> training loss:  0.5677, valid loss:  1.6491, valid f1 score:  0.5053



Training:  14%|█████▋                                    | 203/1501 [00:21<08:51,  2.44it/s][A
Training:  14%|█████▋                                    | 205/1501 [00:21<06:39,  3.24it/s][A
Training:  14%|█████▊                                    | 207/1501 [00:22<05:03,  4.26it/s][A
Training:  14%|█████▊                                    | 209/1501 [00:22<03:53,  5.53it/s][A
Training:  14%|█████▉                                    | 211/1501 [00:22<03:06,  6.93it/s][A
Training:  14%|█████▉                                    | 213/1501 [00:22<02:32,  8.45it/s][A
Training:  14%|██████                                    | 215/1501 [00:22<02:11,  9.75it/s][A
Training:  14%|██████                                    | 217/1501 [00:22<01:55, 11.10it/s][A
Training:  15%|██████▏                                   | 219/1501 [00:22<01:44, 12.27it/s][A
Training:  15%|██████▏                                   | 221/1501 [00:22<01:37, 13.10it/s][A
Training:  15%|██████▏                 

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 36.01it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 33.69it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 34.62it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 35.05it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 36.93it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.97it/s][A[A

Training:  20%|████████▎                                 | 299/1501 [00:32<15:37,  1.28it/s][A
Training:  20%|████████▍                                 | 301/1501 [00:32<11:17,  1.77it/s][A

>>> training loss:  0.5803, valid loss:  1.6589, valid f1 score:  0.4987



Training:  20%|████████▍                                 | 303/1501 [00:32<08:14,  2.42it/s][A
Training:  20%|████████▌                                 | 305/1501 [00:32<06:05,  3.28it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:32<04:06,  4.84it/s][A
Training:  21%|████████▋                                 | 310/1501 [00:33<03:18,  6.00it/s][A
Training:  21%|████████▋                                 | 312/1501 [00:33<02:41,  7.36it/s][A
Training:  21%|████████▊                                 | 314/1501 [00:33<02:15,  8.74it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:33<01:53, 10.42it/s][A
Training:  21%|████████▉                                 | 318/1501 [00:33<01:41, 11.66it/s][A
Training:  21%|████████▉                                 | 320/1501 [00:33<01:34, 12.51it/s][A
Training:  21%|█████████                                 | 322/1501 [00:33<01:26, 13.67it/s][A
Training:  22%|█████████               

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 38.08it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 38.04it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 38.46it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.38it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 38.22it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.99it/s][A[A

Training:  27%|███████████▏                              | 400/1501 [00:43<13:53,  1.32it/s][A
Training:  27%|███████████▏                              | 402/1501 [00:43<10:00,  1.83it/s][A

>>> training loss:  0.6294, valid loss:  1.6867, valid f1 score:  0.5119



Training:  27%|███████████▎                              | 404/1501 [00:43<07:18,  2.50it/s][A
Training:  27%|███████████▎                              | 406/1501 [00:43<05:22,  3.39it/s][A
Training:  27%|███████████▍                              | 408/1501 [00:43<04:04,  4.47it/s][A
Training:  27%|███████████▍                              | 410/1501 [00:43<03:11,  5.69it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:43<02:33,  7.09it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:43<02:04,  8.71it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:44<01:45, 10.33it/s][A
Training:  28%|███████████▋                              | 418/1501 [00:44<01:31, 11.86it/s][A
Training:  28%|███████████▊                              | 420/1501 [00:44<01:21, 13.34it/s][A
Training:  28%|███████████▊                              | 422/1501 [00:44<01:14, 14.56it/s][A
Training:  28%|███████████▊            

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 38.61it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 36.70it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 35.07it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 35.06it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 35.00it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.93it/s][A[A

Training:  33%|█████████████▉                            | 500/1501 [00:53<12:59,  1.28it/s][A
Training:  33%|██████████████                            | 502/1501 [00:53<09:21,  1.78it/s][A

>>> training loss:  0.6428, valid loss:  1.7071, valid f1 score:  0.5059



Training:  34%|██████████████                            | 504/1501 [00:54<06:49,  2.43it/s][A
Training:  34%|██████████████▏                           | 506/1501 [00:54<05:02,  3.29it/s][A
Training:  34%|██████████████▏                           | 508/1501 [00:54<03:49,  4.33it/s][A
Training:  34%|██████████████▎                           | 510/1501 [00:54<02:57,  5.57it/s][A
Training:  34%|██████████████▎                           | 512/1501 [00:54<02:23,  6.87it/s][A
Training:  34%|██████████████▍                           | 514/1501 [00:54<02:00,  8.20it/s][A
Training:  34%|██████████████▍                           | 516/1501 [00:54<01:40,  9.79it/s][A
Training:  35%|██████████████▍                           | 518/1501 [00:54<01:27, 11.26it/s][A
Training:  35%|██████████████▌                           | 520/1501 [00:55<01:18, 12.53it/s][A
Training:  35%|██████████████▌                           | 522/1501 [00:55<01:11, 13.61it/s][A
Training:  35%|██████████████▋         

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:04<00:00, 33.37it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 34.26it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 35.18it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 36.30it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 35.76it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 36.08it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.00it/s][A[A

Training:  40%|████████████████▊                         | 600/1501 [01:04<11:40,  1.29it/s][A
Training:  40%|████████████████▊                         | 602/1501 [01:04<08:24,  1.78it/s][A

>>> training loss:  0.6363, valid loss:  1.6829, valid f1 score:  0.5065



Training:  40%|████████████████▉                         | 604/1501 [01:04<06:09,  2.43it/s][A
Training:  40%|████████████████▉                         | 606/1501 [01:04<04:33,  3.27it/s][A
Training:  41%|█████████████████                         | 608/1501 [01:05<03:29,  4.27it/s][A
Training:  41%|█████████████████                         | 610/1501 [01:05<02:42,  5.49it/s][A
Training:  41%|█████████████████                         | 612/1501 [01:05<02:07,  6.98it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [01:05<01:45,  8.43it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [01:05<01:28, 10.02it/s][A
Training:  41%|█████████████████▎                        | 618/1501 [01:05<01:16, 11.52it/s][A
Training:  41%|█████████████████▎                        | 620/1501 [01:05<01:12, 12.15it/s][A
Training:  41%|█████████████████▍                        | 622/1501 [01:05<01:05, 13.41it/s][A
Training:  42%|█████████████████▍      

Evaluation...:  81%|██████████████████████████████▉       | 136/167 [00:04<00:01, 27.34it/s][A[A

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:04<00:00, 29.87it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 32.04it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 33.42it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 35.18it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 35.79it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:05<00:00, 36.71it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 31.72it/s][A[A

Training:  47%|███████████████████▌                      | 699/1501 [01:15<11:20,  1.18it/s][A
Training:  47%|███████████████████▌                      | 701/1501 [01:15<08:07,  1.64it/s][A

>>> training loss:  0.6566, valid loss:  1.6832, valid f1 score:  0.4985



Training:  47%|███████████████████▋                      | 703/1501 [01:15<05:55,  2.24it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [01:16<04:21,  3.04it/s][A
Training:  47%|███████████████████▊                      | 707/1501 [01:16<03:17,  4.02it/s][A
Training:  47%|███████████████████▊                      | 709/1501 [01:16<02:32,  5.20it/s][A
Training:  47%|███████████████████▉                      | 711/1501 [01:16<01:59,  6.60it/s][A
Training:  48%|███████████████████▉                      | 713/1501 [01:16<01:36,  8.19it/s][A
Training:  48%|████████████████████                      | 715/1501 [01:16<01:21,  9.70it/s][A
Training:  48%|████████████████████                      | 717/1501 [01:16<01:10, 11.15it/s][A
Training:  48%|████████████████████                      | 719/1501 [01:16<01:01, 12.64it/s][A
Training:  48%|████████████████████▏                     | 721/1501 [01:16<00:58, 13.40it/s][A
Training:  48%|████████████████████▏   

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:03<00:00, 36.46it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:03<00:00, 35.47it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 37.33it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 36.14it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 36.24it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.66it/s][A[A

Training:  53%|██████████████████████▎                   | 799/1501 [01:27<08:42,  1.34it/s][A
Training:  53%|██████████████████████▍                   | 801/1501 [01:27<06:15,  1.86it/s][A

>>> training loss:  0.6722, valid loss:  1.6912, valid f1 score:  0.5043



Training:  53%|██████████████████████▍                   | 803/1501 [01:27<04:35,  2.54it/s][A
Training:  54%|██████████████████████▌                   | 805/1501 [01:27<03:24,  3.40it/s][A
Training:  54%|██████████████████████▌                   | 807/1501 [01:27<02:35,  4.46it/s][A
Training:  54%|██████████████████████▋                   | 809/1501 [01:27<02:00,  5.74it/s][A
Training:  54%|██████████████████████▋                   | 811/1501 [01:27<01:38,  7.04it/s][A
Training:  54%|██████████████████████▋                   | 813/1501 [01:27<01:20,  8.58it/s][A
Training:  54%|██████████████████████▊                   | 815/1501 [01:27<01:08, 10.05it/s][A
Training:  54%|██████████████████████▊                   | 817/1501 [01:28<00:59, 11.48it/s][A
Training:  55%|██████████████████████▉                   | 819/1501 [01:28<00:54, 12.53it/s][A
Training:  55%|██████████████████████▉                   | 821/1501 [01:28<00:50, 13.46it/s][A
Training:  55%|███████████████████████ 

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 36.38it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 33.35it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 32.83it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 30.10it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 30.49it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 31.50it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 33.70it/s][A[A

Training:  60%|█████████████████████████▏                | 899/1501 [01:37<08:03,  1.25it/s][A
Training:  60%|█████████████████████████▏                | 901/1501 [01:37<05:48,  1.72it/s][A

>>> training loss:  0.6437, valid loss:  1.7186, valid f1 score:  0.4876



Training:  60%|█████████████████████████▎                | 903/1501 [01:38<04:15,  2.34it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:38<03:08,  3.16it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:38<02:21,  4.20it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:38<01:48,  5.47it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:38<01:26,  6.82it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:38<01:09,  8.40it/s][A
Training:  61%|█████████████████████████▌                | 915/1501 [01:38<00:58, 10.01it/s][A
Training:  61%|█████████████████████████▋                | 917/1501 [01:38<00:53, 10.94it/s][A
Training:  61%|█████████████████████████▋                | 919/1501 [01:39<00:46, 12.38it/s][A
Training:  61%|█████████████████████████▊                | 921/1501 [01:39<00:42, 13.50it/s][A
Training:  61%|████████████████████████

Training:  67%|███████████████████████████▎             | 1000/1501 [01:47<05:34,  1.50it/s][A
Training:  67%|███████████████████████████▎             | 1002/1501 [01:47<04:02,  2.06it/s][A

>>> training loss:  0.6934, valid loss:  1.7611, valid f1 score:  0.4786



Training:  67%|███████████████████████████▍             | 1004/1501 [01:48<02:57,  2.80it/s][A
Training:  67%|███████████████████████████▍             | 1006/1501 [01:48<02:12,  3.74it/s][A
Training:  67%|███████████████████████████▌             | 1008/1501 [01:48<01:40,  4.92it/s][A
Training:  67%|███████████████████████████▌             | 1010/1501 [01:48<01:17,  6.33it/s][A
Training:  67%|███████████████████████████▋             | 1012/1501 [01:48<01:03,  7.68it/s][A
Training:  68%|███████████████████████████▋             | 1014/1501 [01:48<00:54,  9.01it/s][A
Training:  68%|███████████████████████████▊             | 1016/1501 [01:48<00:45, 10.75it/s][A
Training:  68%|███████████████████████████▊             | 1018/1501 [01:48<00:39, 12.24it/s][A
Training:  68%|███████████████████████████▊             | 1020/1501 [01:48<00:35, 13.55it/s][A
Training:  68%|███████████████████████████▉             | 1022/1501 [01:49<00:32, 14.93it/s][A
Training:  68%|████████████████████████

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 35.64it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.28it/s][A[A

Training:  73%|██████████████████████████████           | 1099/1501 [01:57<04:43,  1.42it/s][A
Training:  73%|██████████████████████████████           | 1101/1501 [01:57<03:24,  1.95it/s][A

>>> training loss:  0.7160, valid loss:  1.7080, valid f1 score:  0.5050



Training:  73%|██████████████████████████████▏          | 1103/1501 [01:57<02:29,  2.66it/s][A
Training:  74%|██████████████████████████████▏          | 1105/1501 [01:58<01:50,  3.58it/s][A
Training:  74%|██████████████████████████████▏          | 1107/1501 [01:58<01:24,  4.66it/s][A
Training:  74%|██████████████████████████████▎          | 1109/1501 [01:58<01:05,  5.98it/s][A
Training:  74%|██████████████████████████████▎          | 1111/1501 [01:58<00:52,  7.37it/s][A
Training:  74%|██████████████████████████████▍          | 1113/1501 [01:58<00:43,  8.96it/s][A
Training:  74%|██████████████████████████████▍          | 1115/1501 [01:58<00:36, 10.55it/s][A
Training:  74%|██████████████████████████████▌          | 1117/1501 [01:58<00:31, 12.09it/s][A
Training:  75%|██████████████████████████████▌          | 1119/1501 [01:58<00:28, 13.33it/s][A
Training:  75%|██████████████████████████████▌          | 1121/1501 [01:58<00:27, 13.61it/s][A
Training:  75%|████████████████████████

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 40.90it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 41.12it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.89it/s][A[A

Training:  80%|████████████████████████████████▊        | 1199/1501 [02:08<03:33,  1.42it/s][A
Training:  80%|████████████████████████████████▊        | 1201/1501 [02:08<02:33,  1.96it/s][A

>>> training loss:  0.7313, valid loss:  1.7021, valid f1 score:  0.4893



Training:  80%|████████████████████████████████▊        | 1203/1501 [02:08<01:52,  2.65it/s][A
Training:  80%|████████████████████████████████▉        | 1205/1501 [02:08<01:23,  3.56it/s][A
Training:  80%|████████████████████████████████▉        | 1207/1501 [02:08<01:03,  4.63it/s][A
Training:  81%|█████████████████████████████████        | 1209/1501 [02:08<00:50,  5.75it/s][A
Training:  81%|█████████████████████████████████        | 1211/1501 [02:08<00:41,  7.05it/s][A
Training:  81%|█████████████████████████████████▏       | 1213/1501 [02:08<00:34,  8.30it/s][A
Training:  81%|█████████████████████████████████▏       | 1215/1501 [02:09<00:29,  9.67it/s][A
Training:  81%|█████████████████████████████████▏       | 1217/1501 [02:09<00:26, 10.75it/s][A
Training:  81%|█████████████████████████████████▎       | 1219/1501 [02:09<00:23, 11.83it/s][A
Training:  81%|█████████████████████████████████▎       | 1221/1501 [02:09<00:21, 12.90it/s][A
Training:  81%|████████████████████████

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 34.90it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 34.25it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 35.76it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.52it/s][A[A

Training:  87%|███████████████████████████████████▍     | 1299/1501 [02:18<02:31,  1.34it/s][A
Training:  87%|███████████████████████████████████▌     | 1301/1501 [02:19<01:49,  1.83it/s][A

>>> training loss:  0.7194, valid loss:  1.7578, valid f1 score:  0.4904



Training:  87%|███████████████████████████████████▌     | 1303/1501 [02:19<01:19,  2.49it/s][A
Training:  87%|███████████████████████████████████▋     | 1305/1501 [02:19<00:59,  3.31it/s][A
Training:  87%|███████████████████████████████████▋     | 1307/1501 [02:19<00:44,  4.40it/s][A
Training:  87%|███████████████████████████████████▊     | 1309/1501 [02:19<00:34,  5.62it/s][A
Training:  87%|███████████████████████████████████▊     | 1311/1501 [02:19<00:27,  6.85it/s][A
Training:  87%|███████████████████████████████████▊     | 1313/1501 [02:19<00:22,  8.44it/s][A
Training:  88%|███████████████████████████████████▉     | 1315/1501 [02:19<00:18,  9.81it/s][A
Training:  88%|███████████████████████████████████▉     | 1317/1501 [02:20<00:16, 11.13it/s][A
Training:  88%|████████████████████████████████████     | 1319/1501 [02:20<00:15, 12.06it/s][A
Training:  88%|████████████████████████████████████     | 1321/1501 [02:20<00:13, 13.29it/s][A
Training:  88%|████████████████████████

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 37.04it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 38.65it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 38.31it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.37it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.69it/s][A[A

Training:  93%|██████████████████████████████████████▏  | 1400/1501 [02:29<01:14,  1.35it/s][A
Training:  93%|██████████████████████████████████████▎  | 1402/1501 [02:29<00:53,  1.86it/s][A

>>> training loss:  0.7520, valid loss:  1.7175, valid f1 score:  0.4851



Training:  94%|██████████████████████████████████████▎  | 1404/1501 [02:29<00:38,  2.54it/s][A
Training:  94%|██████████████████████████████████████▍  | 1406/1501 [02:29<00:27,  3.44it/s][A
Training:  94%|██████████████████████████████████████▍  | 1408/1501 [02:29<00:20,  4.54it/s][A
Training:  94%|██████████████████████████████████████▌  | 1410/1501 [02:30<00:15,  5.77it/s][A
Training:  94%|██████████████████████████████████████▌  | 1412/1501 [02:30<00:12,  7.16it/s][A
Training:  94%|██████████████████████████████████████▌  | 1414/1501 [02:30<00:10,  8.27it/s][A
Training:  94%|██████████████████████████████████████▋  | 1416/1501 [02:30<00:08,  9.53it/s][A
Training:  94%|██████████████████████████████████████▋  | 1418/1501 [02:30<00:07, 10.99it/s][A
Training:  95%|██████████████████████████████████████▊  | 1420/1501 [02:30<00:06, 12.01it/s][A
Training:  95%|██████████████████████████████████████▊  | 1422/1501 [02:30<00:06, 13.02it/s][A
Training:  95%|████████████████████████

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 37.44it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 38.07it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 38.29it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 37.63it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.23it/s][A[A

Training: 100%|████████████████████████████████████████▉| 1499/1501 [02:39<00:01,  1.37it/s][A
Training: 100%|█████████████████████████████████████████| 1501/1501 [02:39<00:00,  9.39it/s][A
 25%|██████████████                                          | 2/8 [05:16<15:51, 158.54s/it]

>>> training loss:  0.7677, valid loss:  1.7190, valid f1 score:  0.4895



Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:27, 17.04it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:30, 16.61it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:25, 17.46it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:31, 16.27it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:34, 15.85it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:32, 16.16it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:30, 16.48it/s][A
Training:   1%|▍                                          | 16/1501 [00:00<01:31, 16.22it/s][A
Training:   1%|▌                                          | 18/1501 [00:01<01:29, 16.61it/s][A
Training:   1%|▌                       

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:03<00:00, 38.76it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 37.71it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 39.32it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 37.81it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.13it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 38.22it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.61it/s][A[A

Training:   7%|██▊                                        | 98/1501 [00:10<16:57,  1.38it/s][A
Training:   7%|██▊                                       | 100/1501 [00:10<12:17,  1.90it/s][A

>>> training loss:  0.4844, valid loss:  1.7336, valid f1 score:  0.4822



Training:   7%|██▊                                       | 102/1501 [00:10<08:59,  2.59it/s][A
Training:   7%|██▉                                       | 104/1501 [00:10<06:40,  3.49it/s][A
Training:   7%|██▉                                       | 106/1501 [00:10<05:05,  4.57it/s][A
Training:   7%|███                                       | 108/1501 [00:10<03:57,  5.86it/s][A
Training:   7%|███                                       | 110/1501 [00:11<03:08,  7.39it/s][A
Training:   7%|███▏                                      | 112/1501 [00:11<02:36,  8.89it/s][A
Training:   8%|███▏                                      | 114/1501 [00:11<02:14, 10.33it/s][A
Training:   8%|███▎                                      | 117/1501 [00:11<01:50, 12.58it/s][A
Training:   8%|███▎                                      | 119/1501 [00:11<01:44, 13.25it/s][A
Training:   8%|███▍                                      | 121/1501 [00:11<01:38, 14.00it/s][A
Training:   8%|███▍                    

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 33.84it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 35.17it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 34.83it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 35.95it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 33.67it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.61it/s][A[A

Training:  13%|█████▌                                    | 198/1501 [00:20<16:32,  1.31it/s][A
Training:  13%|█████▌                                    | 200/1501 [00:21<12:09,  1.78it/s][A

>>> training loss:  0.4613, valid loss:  1.7683, valid f1 score:  0.4937



Training:  13%|█████▋                                    | 202/1501 [00:21<08:56,  2.42it/s][A
Training:  14%|█████▋                                    | 204/1501 [00:21<06:39,  3.25it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:21<05:01,  4.29it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:21<04:01,  5.35it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:21<03:16,  6.57it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:21<02:40,  8.04it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:22<02:19,  9.24it/s][A
Training:  14%|██████                                    | 216/1501 [00:22<01:58, 10.83it/s][A
Training:  15%|██████                                    | 218/1501 [00:22<01:44, 12.30it/s][A
Training:  15%|██████▏                                   | 220/1501 [00:22<01:43, 12.41it/s][A
Training:  15%|██████▏                 

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.48it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 38.88it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 38.11it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 38.46it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 37.24it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.20it/s][A[A

Training:  20%|████████▎                                 | 298/1501 [00:31<14:51,  1.35it/s][A
Training:  20%|████████▍                                 | 300/1501 [00:31<10:43,  1.87it/s][A

>>> training loss:  0.4899, valid loss:  1.7836, valid f1 score:  0.4951



Training:  20%|████████▍                                 | 302/1501 [00:31<07:50,  2.55it/s][A
Training:  20%|████████▌                                 | 304/1501 [00:32<05:48,  3.43it/s][A
Training:  20%|████████▌                                 | 306/1501 [00:32<04:24,  4.52it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:32<03:24,  5.82it/s][A
Training:  21%|████████▋                                 | 310/1501 [00:32<02:45,  7.18it/s][A
Training:  21%|████████▋                                 | 312/1501 [00:32<02:19,  8.55it/s][A
Training:  21%|████████▊                                 | 314/1501 [00:32<01:59,  9.89it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:32<01:44, 11.32it/s][A
Training:  21%|████████▉                                 | 318/1501 [00:32<01:32, 12.76it/s][A
Training:  21%|████████▉                                 | 320/1501 [00:33<01:24, 14.05it/s][A
Training:  21%|█████████               

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 34.77it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 34.77it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 36.73it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 34.60it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 32.67it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 29.65it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.52it/s][A[A

Training:  27%|███████████▏                              | 398/1501 [00:42<14:25,  1.27it/s][A
Training:  27%|███████████▏                              | 400/1501 [00:42<10:28,  1.75it/s][A

>>> training loss:  0.4916, valid loss:  1.7947, valid f1 score:  0.4927



Training:  27%|███████████▏                              | 402/1501 [00:42<07:41,  2.38it/s][A
Training:  27%|███████████▎                              | 404/1501 [00:42<05:39,  3.23it/s][A
Training:  27%|███████████▎                              | 406/1501 [00:42<04:16,  4.27it/s][A
Training:  27%|███████████▍                              | 408/1501 [00:43<03:18,  5.51it/s][A
Training:  27%|███████████▍                              | 410/1501 [00:43<02:38,  6.88it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:43<02:12,  8.24it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:43<01:54,  9.50it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:43<01:41, 10.65it/s][A
Training:  28%|███████████▋                              | 418/1501 [00:43<01:33, 11.59it/s][A
Training:  28%|███████████▊                              | 420/1501 [00:43<01:24, 12.72it/s][A
Training:  28%|███████████▊            

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 36.31it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 38.49it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 37.21it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 38.70it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.55it/s][A[A

Training:  33%|█████████████▉                            | 499/1501 [00:52<12:09,  1.37it/s][A
Training:  33%|██████████████                            | 501/1501 [00:52<08:46,  1.90it/s][A

>>> training loss:  0.5276, valid loss:  1.8186, valid f1 score:  0.4966



Training:  34%|██████████████                            | 503/1501 [00:53<06:24,  2.60it/s][A
Training:  34%|██████████████▏                           | 505/1501 [00:53<04:45,  3.48it/s][A
Training:  34%|██████████████▏                           | 507/1501 [00:53<03:36,  4.58it/s][A
Training:  34%|██████████████▏                           | 509/1501 [00:53<02:47,  5.93it/s][A
Training:  34%|██████████████▎                           | 511/1501 [00:53<02:13,  7.42it/s][A
Training:  34%|██████████████▎                           | 513/1501 [00:53<01:50,  8.98it/s][A
Training:  34%|██████████████▍                           | 515/1501 [00:53<01:32, 10.63it/s][A
Training:  34%|██████████████▍                           | 517/1501 [00:53<01:21, 12.10it/s][A
Training:  35%|██████████████▌                           | 519/1501 [00:53<01:12, 13.56it/s][A
Training:  35%|██████████████▌                           | 521/1501 [00:54<01:06, 14.66it/s][A
Training:  35%|██████████████▋         

Evaluation...:  76%|████████████████████████████▉         | 127/167 [00:03<00:01, 37.58it/s][A[A

Evaluation...:  78%|█████████████████████████████▊        | 131/167 [00:04<00:00, 36.36it/s][A[A

Evaluation...:  81%|██████████████████████████████▉       | 136/167 [00:04<00:00, 38.05it/s][A[A

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:04<00:00, 38.36it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:04<00:00, 38.13it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 35.38it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 33.27it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 30.81it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:05<00:00, 29.68it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 31.98it/s][A[A



>>> training loss:  0.5468, valid loss:  1.7862, valid f1 score:  0.4818



Training:  40%|████████████████▊                         | 603/1501 [01:04<06:49,  2.19it/s][A
Training:  40%|████████████████▉                         | 605/1501 [01:04<05:08,  2.91it/s][A
Training:  40%|████████████████▉                         | 607/1501 [01:05<03:56,  3.79it/s][A
Training:  41%|█████████████████                         | 609/1501 [01:05<03:04,  4.82it/s][A
Training:  41%|█████████████████                         | 611/1501 [01:05<02:25,  6.11it/s][A
Training:  41%|█████████████████▏                        | 613/1501 [01:05<01:59,  7.42it/s][A
Training:  41%|█████████████████▏                        | 615/1501 [01:05<01:42,  8.68it/s][A
Training:  41%|█████████████████▎                        | 617/1501 [01:05<01:31,  9.64it/s][A
Training:  41%|█████████████████▎                        | 619/1501 [01:05<01:25, 10.33it/s][A
Training:  41%|█████████████████▍                        | 621/1501 [01:06<01:22, 10.66it/s][A
Training:  42%|█████████████████▍      

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 38.40it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 40.06it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 40.18it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 39.30it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.58it/s][A[A

Training:  47%|███████████████████▌                      | 699/1501 [01:16<09:57,  1.34it/s][A
Training:  47%|███████████████████▌                      | 701/1501 [01:16<07:11,  1.85it/s][A

>>> training loss:  0.5506, valid loss:  1.8140, valid f1 score:  0.4905



Training:  47%|███████████████████▋                      | 703/1501 [01:16<05:14,  2.54it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [01:16<03:53,  3.41it/s][A
Training:  47%|███████████████████▊                      | 707/1501 [01:16<03:01,  4.37it/s][A
Training:  47%|███████████████████▊                      | 709/1501 [01:16<02:23,  5.50it/s][A
Training:  47%|███████████████████▉                      | 711/1501 [01:17<01:54,  6.92it/s][A
Training:  48%|███████████████████▉                      | 713/1501 [01:17<01:42,  7.69it/s][A
Training:  48%|████████████████████                      | 715/1501 [01:17<01:26,  9.05it/s][A
Training:  48%|████████████████████                      | 717/1501 [01:17<01:15, 10.44it/s][A
Training:  48%|████████████████████                      | 719/1501 [01:17<01:04, 12.13it/s][A
Training:  48%|████████████████████▏                     | 721/1501 [01:17<01:01, 12.78it/s][A
Training:  48%|████████████████████▏   

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 36.84it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 36.39it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 33.76it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 34.65it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 34.03it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.90it/s][A[A

Training:  53%|██████████████████████▎                   | 799/1501 [01:26<08:52,  1.32it/s][A
Training:  53%|██████████████████████▍                   | 801/1501 [01:27<06:24,  1.82it/s][A

>>> training loss:  0.5487, valid loss:  1.7907, valid f1 score:  0.4900



Training:  53%|██████████████████████▍                   | 803/1501 [01:27<04:41,  2.48it/s][A
Training:  54%|██████████████████████▌                   | 805/1501 [01:27<03:28,  3.34it/s][A
Training:  54%|██████████████████████▌                   | 807/1501 [01:27<02:37,  4.41it/s][A
Training:  54%|██████████████████████▋                   | 809/1501 [01:27<02:01,  5.68it/s][A
Training:  54%|██████████████████████▋                   | 811/1501 [01:27<01:37,  7.05it/s][A
Training:  54%|██████████████████████▋                   | 813/1501 [01:27<01:21,  8.49it/s][A
Training:  54%|██████████████████████▊                   | 815/1501 [01:27<01:07, 10.11it/s][A
Training:  54%|██████████████████████▊                   | 817/1501 [01:28<00:58, 11.72it/s][A
Training:  55%|██████████████████████▉                   | 819/1501 [01:28<00:53, 12.81it/s][A
Training:  55%|██████████████████████▉                   | 821/1501 [01:28<00:48, 14.04it/s][A
Training:  55%|███████████████████████ 

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 36.16it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 39.30it/s][A[A

Training:  60%|█████████████████████████▏                | 899/1501 [01:36<06:56,  1.44it/s][A
Training:  60%|█████████████████████████▏                | 901/1501 [01:37<05:01,  1.99it/s][A

>>> training loss:  0.5816, valid loss:  1.8139, valid f1 score:  0.5045



Training:  60%|█████████████████████████▎                | 903/1501 [01:37<03:41,  2.70it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:37<02:44,  3.63it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:37<02:04,  4.77it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:37<01:36,  6.11it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:37<01:16,  7.68it/s][A
Training:  61%|█████████████████████████▌                | 914/1501 [01:37<00:58, 10.02it/s][A
Training:  61%|█████████████████████████▋                | 916/1501 [01:37<00:51, 11.29it/s][A
Training:  61%|█████████████████████████▋                | 918/1501 [01:37<00:46, 12.67it/s][A
Training:  61%|█████████████████████████▋                | 920/1501 [01:38<00:41, 13.89it/s][A
Training:  61%|█████████████████████████▊                | 922/1501 [01:38<00:38, 14.90it/s][A
Training:  62%|████████████████████████

Evaluation...:  72%|███████████████████████████▎          | 120/167 [00:04<00:01, 26.97it/s][A[A

Evaluation...:  74%|████████████████████████████▏         | 124/167 [00:04<00:01, 28.00it/s][A[A

Evaluation...:  76%|████████████████████████████▉         | 127/167 [00:04<00:01, 27.95it/s][A[A

Evaluation...:  78%|█████████████████████████████▌        | 130/167 [00:04<00:01, 26.70it/s][A[A

Evaluation...:  80%|██████████████████████████████▎       | 133/167 [00:04<00:01, 27.52it/s][A[A

Evaluation...:  82%|███████████████████████████████▏      | 137/167 [00:04<00:01, 29.60it/s][A[A

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:05<00:00, 30.40it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:05<00:00, 28.97it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:05<00:00, 29.21it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:05<00:00, 29.40it/s][A[A



>>> training loss:  0.5951, valid loss:  1.7997, valid f1 score:  0.4942



Training:  67%|███████████████████████████▎             | 1002/1501 [01:49<04:13,  1.97it/s][A
Training:  67%|███████████████████████████▍             | 1004/1501 [01:49<03:04,  2.70it/s][A
Training:  67%|███████████████████████████▍             | 1006/1501 [01:49<02:18,  3.58it/s][A
Training:  67%|███████████████████████████▌             | 1008/1501 [01:49<01:47,  4.57it/s][A
Training:  67%|███████████████████████████▌             | 1010/1501 [01:49<01:26,  5.70it/s][A
Training:  67%|███████████████████████████▋             | 1012/1501 [01:49<01:11,  6.88it/s][A
Training:  68%|███████████████████████████▋             | 1014/1501 [01:50<00:58,  8.28it/s][A
Training:  68%|███████████████████████████▊             | 1016/1501 [01:50<00:51,  9.46it/s][A
Training:  68%|███████████████████████████▊             | 1018/1501 [01:50<00:47, 10.18it/s][A
Training:  68%|███████████████████████████▊             | 1020/1501 [01:50<00:42, 11.21it/s][A
Training:  68%|████████████████████████

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 28.68it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 30.62it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 33.40it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 34.44it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 35.15it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.51it/s][A[A

Training:  73%|█████████████████████████████▉           | 1098/1501 [02:00<05:01,  1.34it/s][A
Training:  73%|██████████████████████████████           | 1100/1501 [02:00<03:37,  1.85it/s][A

>>> training loss:  0.6016, valid loss:  1.8250, valid f1 score:  0.4834



Training:  73%|██████████████████████████████           | 1102/1501 [02:00<02:38,  2.52it/s][A
Training:  74%|██████████████████████████████▏          | 1104/1501 [02:00<01:56,  3.42it/s][A
Training:  74%|██████████████████████████████▏          | 1106/1501 [02:00<01:27,  4.51it/s][A
Training:  74%|██████████████████████████████▎          | 1108/1501 [02:01<01:08,  5.70it/s][A
Training:  74%|██████████████████████████████▎          | 1110/1501 [02:01<00:54,  7.13it/s][A
Training:  74%|██████████████████████████████▎          | 1112/1501 [02:01<00:45,  8.55it/s][A
Training:  74%|██████████████████████████████▍          | 1114/1501 [02:01<00:38, 10.11it/s][A
Training:  74%|██████████████████████████████▍          | 1116/1501 [02:01<00:33, 11.66it/s][A
Training:  74%|██████████████████████████████▌          | 1118/1501 [02:01<00:29, 12.96it/s][A
Training:  75%|██████████████████████████████▌          | 1120/1501 [02:01<00:29, 13.02it/s][A
Training:  75%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 39.15it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 40.31it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 40.26it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 39.30it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.00it/s][A[A

Training:  80%|████████████████████████████████▋        | 1198/1501 [02:11<03:49,  1.32it/s][A
Training:  80%|████████████████████████████████▊        | 1200/1501 [02:11<02:44,  1.83it/s][A

>>> training loss:  0.6071, valid loss:  1.8046, valid f1 score:  0.4943



Training:  80%|████████████████████████████████▊        | 1202/1501 [02:11<01:59,  2.50it/s][A
Training:  80%|████████████████████████████████▉        | 1204/1501 [02:11<01:28,  3.36it/s][A
Training:  80%|████████████████████████████████▉        | 1206/1501 [02:11<01:06,  4.43it/s][A
Training:  80%|████████████████████████████████▉        | 1208/1501 [02:11<00:51,  5.70it/s][A
Training:  81%|█████████████████████████████████        | 1210/1501 [02:12<00:40,  7.10it/s][A
Training:  81%|█████████████████████████████████        | 1212/1501 [02:12<00:33,  8.67it/s][A
Training:  81%|█████████████████████████████████▏       | 1214/1501 [02:12<00:27, 10.29it/s][A
Training:  81%|█████████████████████████████████▏       | 1216/1501 [02:12<00:23, 11.99it/s][A
Training:  81%|█████████████████████████████████▎       | 1218/1501 [02:12<00:21, 13.03it/s][A
Training:  81%|█████████████████████████████████▎       | 1220/1501 [02:12<00:20, 14.03it/s][A
Training:  81%|████████████████████████

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:04<00:00, 38.29it/s][A[A

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:04<00:00, 38.74it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 38.49it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 39.58it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.20it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.81it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.67it/s][A[A

Training:  86%|███████████████████████████████████▍     | 1298/1501 [02:22<02:40,  1.26it/s][A
Training:  87%|███████████████████████████████████▌     | 1300/1501 [02:22<01:55,  1.74it/s][A

>>> training loss:  0.6711, valid loss:  1.8186, valid f1 score:  0.4938



Training:  87%|███████████████████████████████████▌     | 1302/1501 [02:22<01:23,  2.39it/s][A
Training:  87%|███████████████████████████████████▌     | 1304/1501 [02:22<01:01,  3.23it/s][A
Training:  87%|███████████████████████████████████▋     | 1306/1501 [02:22<00:45,  4.28it/s][A
Training:  87%|███████████████████████████████████▋     | 1308/1501 [02:22<00:34,  5.52it/s][A
Training:  87%|███████████████████████████████████▊     | 1310/1501 [02:22<00:27,  6.94it/s][A
Training:  87%|███████████████████████████████████▊     | 1312/1501 [02:23<00:22,  8.55it/s][A
Training:  88%|███████████████████████████████████▉     | 1314/1501 [02:23<00:18, 10.03it/s][A
Training:  88%|███████████████████████████████████▉     | 1316/1501 [02:23<00:16, 11.43it/s][A
Training:  88%|████████████████████████████████████     | 1318/1501 [02:23<00:14, 12.89it/s][A
Training:  88%|████████████████████████████████████     | 1320/1501 [02:23<00:12, 14.15it/s][A
Training:  88%|████████████████████████

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 40.07it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 40.13it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 38.82it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.36it/s][A[A

Training:  93%|██████████████████████████████████████▏  | 1398/1501 [02:32<01:13,  1.41it/s][A
Training:  93%|██████████████████████████████████████▏  | 1400/1501 [02:32<00:52,  1.93it/s][A

>>> training loss:  0.6642, valid loss:  1.8232, valid f1 score:  0.4947



Training:  93%|██████████████████████████████████████▎  | 1402/1501 [02:32<00:37,  2.65it/s][A
Training:  94%|██████████████████████████████████████▎  | 1404/1501 [02:32<00:27,  3.54it/s][A
Training:  94%|██████████████████████████████████████▍  | 1406/1501 [02:32<00:20,  4.68it/s][A
Training:  94%|██████████████████████████████████████▍  | 1408/1501 [02:32<00:15,  6.06it/s][A
Training:  94%|██████████████████████████████████████▌  | 1410/1501 [02:33<00:12,  7.55it/s][A
Training:  94%|██████████████████████████████████████▌  | 1412/1501 [02:33<00:10,  8.86it/s][A
Training:  94%|██████████████████████████████████████▌  | 1414/1501 [02:33<00:08, 10.56it/s][A
Training:  94%|██████████████████████████████████████▋  | 1416/1501 [02:33<00:07, 11.99it/s][A
Training:  94%|██████████████████████████████████████▋  | 1418/1501 [02:33<00:06, 13.17it/s][A
Training:  95%|██████████████████████████████████████▊  | 1420/1501 [02:33<00:05, 14.33it/s][A
Training:  95%|████████████████████████

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:03<00:00, 39.16it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.52it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 38.03it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.46it/s][A[A

Training: 100%|████████████████████████████████████████▉| 1498/1501 [02:42<00:02,  1.42it/s][A
Training: 100%|█████████████████████████████████████████| 1501/1501 [02:42<00:00,  9.24it/s][A
 38%|█████████████████████                                   | 3/8 [07:59<13:21, 160.36s/it]

>>> training loss:  0.6583, valid loss:  1.8068, valid f1 score:  0.4952



Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:28, 16.96it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:22, 18.07it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:27, 17.06it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:22, 18.05it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:20, 18.59it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:21, 18.20it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:20, 18.44it/s][A
Training:   1%|▍                                          | 16/1501 [00:00<01:23, 17.69it/s][A
Training:   1%|▌                                          | 18/1501 [00:01<01:27, 17.00it/s][A
Training:   1%|▌                       

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 37.94it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 39.13it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 38.24it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.17it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.00it/s][A[A

Training:   6%|██▊                                        | 97/1501 [00:09<14:40,  1.59it/s][A
Training:   7%|██▊                                        | 99/1501 [00:09<11:02,  2.12it/s][A

>>> training loss:  0.4377, valid loss:  1.8188, valid f1 score:  0.5026



Training:   7%|██▊                                       | 101/1501 [00:10<08:19,  2.80it/s][A
Training:   7%|██▉                                       | 103/1501 [00:10<06:20,  3.68it/s][A
Training:   7%|██▉                                       | 105/1501 [00:10<04:52,  4.77it/s][A
Training:   7%|██▉                                       | 107/1501 [00:10<03:50,  6.04it/s][A
Training:   7%|███                                       | 109/1501 [00:10<03:03,  7.60it/s][A
Training:   7%|███                                       | 111/1501 [00:10<02:33,  9.08it/s][A
Training:   8%|███▏                                      | 113/1501 [00:10<02:09, 10.69it/s][A
Training:   8%|███▏                                      | 115/1501 [00:10<01:56, 11.87it/s][A
Training:   8%|███▎                                      | 117/1501 [00:11<01:44, 13.25it/s][A
Training:   8%|███▎                                      | 119/1501 [00:11<01:37, 14.19it/s][A
Training:   8%|███▍                    

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:03<00:00, 39.18it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.63it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 39.21it/s][A[A

Training:  13%|█████▌                                    | 197/1501 [00:19<15:06,  1.44it/s][A
Training:  13%|█████▌                                    | 199/1501 [00:19<10:58,  1.98it/s][A

>>> training loss:  0.4058, valid loss:  1.8471, valid f1 score:  0.5027



Training:  13%|█████▌                                    | 201/1501 [00:20<08:02,  2.69it/s][A
Training:  14%|█████▋                                    | 203/1501 [00:20<05:58,  3.62it/s][A
Training:  14%|█████▋                                    | 205/1501 [00:20<04:31,  4.78it/s][A
Training:  14%|█████▊                                    | 207/1501 [00:20<03:30,  6.15it/s][A
Training:  14%|█████▊                                    | 209/1501 [00:20<02:50,  7.57it/s][A
Training:  14%|█████▉                                    | 211/1501 [00:20<02:19,  9.23it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:20<01:51, 11.59it/s][A
Training:  14%|██████                                    | 216/1501 [00:20<01:40, 12.75it/s][A
Training:  15%|██████                                    | 218/1501 [00:20<01:31, 14.01it/s][A
Training:  15%|██████▏                                   | 220/1501 [00:21<01:27, 14.65it/s][A
Training:  15%|██████▏                 

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 40.68it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 39.31it/s][A[A

Training:  20%|████████▎                                 | 297/1501 [00:29<13:56,  1.44it/s][A
Training:  20%|████████▎                                 | 299/1501 [00:29<10:09,  1.97it/s][A

>>> training loss:  0.4245, valid loss:  1.8754, valid f1 score:  0.5008



Training:  20%|████████▍                                 | 301/1501 [00:29<07:25,  2.69it/s][A
Training:  20%|████████▍                                 | 303/1501 [00:30<05:32,  3.61it/s][A
Training:  20%|████████▌                                 | 305/1501 [00:30<04:13,  4.72it/s][A
Training:  20%|████████▌                                 | 307/1501 [00:30<03:16,  6.07it/s][A
Training:  21%|████████▋                                 | 309/1501 [00:30<02:37,  7.57it/s][A
Training:  21%|████████▋                                 | 311/1501 [00:30<02:10,  9.13it/s][A
Training:  21%|████████▊                                 | 313/1501 [00:30<01:50, 10.76it/s][A
Training:  21%|████████▊                                 | 315/1501 [00:30<01:38, 12.03it/s][A
Training:  21%|████████▊                                 | 317/1501 [00:30<01:31, 12.90it/s][A
Training:  21%|████████▉                                 | 319/1501 [00:30<01:26, 13.72it/s][A
Training:  21%|████████▉               

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 39.65it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.81it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.54it/s][A[A

Training:  26%|███████████                               | 397/1501 [00:39<12:42,  1.45it/s][A
Training:  27%|███████████▏                              | 399/1501 [00:39<09:13,  1.99it/s][A

>>> training loss:  0.4466, valid loss:  1.9020, valid f1 score:  0.4832



Training:  27%|███████████▏                              | 401/1501 [00:39<06:51,  2.67it/s][A
Training:  27%|███████████▎                              | 403/1501 [00:40<05:06,  3.58it/s][A
Training:  27%|███████████▎                              | 405/1501 [00:40<03:54,  4.68it/s][A
Training:  27%|███████████▍                              | 407/1501 [00:40<03:03,  5.95it/s][A
Training:  27%|███████████▍                              | 409/1501 [00:40<02:26,  7.43it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:40<01:52,  9.68it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:40<01:37, 11.17it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:40<01:27, 12.47it/s][A
Training:  28%|███████████▋                              | 418/1501 [00:40<01:18, 13.80it/s][A
Training:  28%|███████████▊                              | 420/1501 [00:41<01:13, 14.77it/s][A
Training:  28%|███████████▊            

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 38.76it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:03<00:00, 39.15it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 39.24it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 38.42it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.45it/s][A[A

Training:  33%|█████████████▉                            | 498/1501 [00:49<11:55,  1.40it/s][A
Training:  33%|█████████████▉                            | 500/1501 [00:50<08:36,  1.94it/s][A

>>> training loss:  0.4780, valid loss:  1.8663, valid f1 score:  0.4941



Training:  33%|██████████████                            | 502/1501 [00:50<06:20,  2.62it/s][A
Training:  34%|██████████████                            | 504/1501 [00:50<04:41,  3.54it/s][A
Training:  34%|██████████████▏                           | 507/1501 [00:50<03:11,  5.20it/s][A
Training:  34%|██████████████▏                           | 509/1501 [00:50<02:34,  6.43it/s][A
Training:  34%|██████████████▎                           | 511/1501 [00:50<02:05,  7.86it/s][A
Training:  34%|██████████████▎                           | 513/1501 [00:50<01:46,  9.25it/s][A
Training:  34%|██████████████▍                           | 516/1501 [00:50<01:23, 11.73it/s][A
Training:  35%|██████████████▌                           | 519/1501 [00:51<01:11, 13.65it/s][A
Training:  35%|██████████████▌                           | 521/1501 [00:51<01:07, 14.55it/s][A
Training:  35%|██████████████▋                           | 523/1501 [00:51<01:03, 15.39it/s][A
Training:  35%|██████████████▋         

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 38.30it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.07it/s][A[A

Training:  40%|████████████████▋                         | 597/1501 [00:59<09:48,  1.54it/s][A
Training:  40%|████████████████▊                         | 599/1501 [01:00<07:16,  2.07it/s][A

>>> training loss:  0.4751, valid loss:  1.8725, valid f1 score:  0.4916



Training:  40%|████████████████▊                         | 601/1501 [01:00<05:26,  2.76it/s][A
Training:  40%|████████████████▊                         | 603/1501 [01:00<04:08,  3.62it/s][A
Training:  40%|████████████████▉                         | 605/1501 [01:00<03:10,  4.71it/s][A
Training:  40%|████████████████▉                         | 607/1501 [01:00<02:27,  6.05it/s][A
Training:  41%|█████████████████                         | 609/1501 [01:00<01:59,  7.48it/s][A
Training:  41%|█████████████████                         | 611/1501 [01:00<01:39,  8.98it/s][A
Training:  41%|█████████████████▏                        | 613/1501 [01:00<01:27, 10.20it/s][A
Training:  41%|█████████████████▏                        | 615/1501 [01:00<01:15, 11.74it/s][A
Training:  41%|█████████████████▎                        | 617/1501 [01:01<01:08, 12.92it/s][A
Training:  41%|█████████████████▎                        | 619/1501 [01:01<01:02, 14.16it/s][A
Training:  41%|█████████████████▍      

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 39.10it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 40.06it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 39.90it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 39.09it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.93it/s][A[A

Training:  46%|███████████████████▌                      | 697/1501 [01:10<09:39,  1.39it/s][A
Training:  47%|███████████████████▌                      | 699/1501 [01:10<06:59,  1.91it/s][A

>>> training loss:  0.4908, valid loss:  1.8920, valid f1 score:  0.4855



Training:  47%|███████████████████▌                      | 701/1501 [01:10<05:06,  2.61it/s][A
Training:  47%|███████████████████▋                      | 703/1501 [01:10<03:48,  3.49it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [01:10<02:52,  4.61it/s][A
Training:  47%|███████████████████▊                      | 707/1501 [01:10<02:13,  5.93it/s][A
Training:  47%|███████████████████▊                      | 709/1501 [01:10<01:46,  7.40it/s][A
Training:  47%|███████████████████▉                      | 711/1501 [01:10<01:26,  9.10it/s][A
Training:  48%|███████████████████▉                      | 713/1501 [01:10<01:13, 10.77it/s][A
Training:  48%|████████████████████                      | 715/1501 [01:11<01:04, 12.13it/s][A
Training:  48%|████████████████████                      | 717/1501 [01:11<01:01, 12.65it/s][A
Training:  48%|████████████████████                      | 719/1501 [01:11<00:57, 13.59it/s][A
Training:  48%|████████████████████▏   

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 38.31it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.13it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 38.92it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.36it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.41it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.59it/s][A[A

Training:  53%|██████████████████████▎                   | 798/1501 [01:20<08:29,  1.38it/s][A
Training:  53%|██████████████████████▍                   | 800/1501 [01:20<06:06,  1.91it/s][A

>>> training loss:  0.5098, valid loss:  1.8772, valid f1 score:  0.4922



Training:  53%|██████████████████████▍                   | 802/1501 [01:20<04:27,  2.61it/s][A
Training:  54%|██████████████████████▍                   | 804/1501 [01:20<03:19,  3.49it/s][A
Training:  54%|██████████████████████▌                   | 806/1501 [01:20<02:30,  4.61it/s][A
Training:  54%|██████████████████████▌                   | 808/1501 [01:20<01:58,  5.84it/s][A
Training:  54%|██████████████████████▋                   | 810/1501 [01:21<01:34,  7.31it/s][A
Training:  54%|██████████████████████▋                   | 812/1501 [01:21<01:16,  8.96it/s][A
Training:  54%|██████████████████████▊                   | 814/1501 [01:21<01:06, 10.34it/s][A
Training:  54%|██████████████████████▊                   | 816/1501 [01:21<00:57, 11.87it/s][A
Training:  54%|██████████████████████▉                   | 818/1501 [01:21<00:51, 13.35it/s][A
Training:  55%|██████████████████████▉                   | 820/1501 [01:21<00:46, 14.62it/s][A
Training:  55%|███████████████████████ 

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 39.43it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.80it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.69it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.88it/s][A[A

Training:  60%|█████████████████████████                 | 897/1501 [01:30<07:14,  1.39it/s][A
Training:  60%|█████████████████████████▏                | 899/1501 [01:30<05:13,  1.92it/s][A

>>> training loss:  0.5135, valid loss:  1.9018, valid f1 score:  0.4962



Training:  60%|█████████████████████████▏                | 901/1501 [01:30<03:49,  2.62it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:30<02:50,  3.50it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:30<02:08,  4.65it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:30<01:40,  5.91it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:31<01:19,  7.48it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:31<01:04,  9.09it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:31<00:54, 10.70it/s][A
Training:  61%|█████████████████████████▌                | 915/1501 [01:31<00:48, 12.10it/s][A
Training:  61%|█████████████████████████▋                | 917/1501 [01:31<00:43, 13.41it/s][A
Training:  61%|█████████████████████████▋                | 919/1501 [01:31<00:39, 14.57it/s][A
Training:  61%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.26it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.29it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.62it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.24it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.20it/s][A[A

Training:  66%|███████████████████████████▉              | 998/1501 [01:40<05:57,  1.41it/s][A
Training:  67%|███████████████████████████▎             | 1000/1501 [01:40<04:18,  1.94it/s][A

>>> training loss:  0.5343, valid loss:  1.9232, valid f1 score:  0.5122



Training:  67%|███████████████████████████▎             | 1002/1501 [01:40<03:09,  2.64it/s][A
Training:  67%|███████████████████████████▍             | 1004/1501 [01:40<02:20,  3.53it/s][A
Training:  67%|███████████████████████████▍             | 1006/1501 [01:40<01:47,  4.62it/s][A
Training:  67%|███████████████████████████▌             | 1008/1501 [01:41<01:23,  5.87it/s][A
Training:  67%|███████████████████████████▌             | 1010/1501 [01:41<01:06,  7.39it/s][A
Training:  67%|███████████████████████████▋             | 1012/1501 [01:41<00:54,  8.95it/s][A
Training:  68%|███████████████████████████▋             | 1014/1501 [01:41<00:46, 10.48it/s][A
Training:  68%|███████████████████████████▊             | 1016/1501 [01:41<00:40, 11.90it/s][A
Training:  68%|███████████████████████████▊             | 1018/1501 [01:41<00:35, 13.52it/s][A
Training:  68%|███████████████████████████▊             | 1020/1501 [01:41<00:32, 14.60it/s][A
Training:  68%|████████████████████████

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.90it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.23it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.99it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.35it/s][A[A

Training:  73%|█████████████████████████████▉           | 1098/1501 [01:50<04:38,  1.45it/s][A
Training:  73%|██████████████████████████████           | 1100/1501 [01:50<03:22,  1.98it/s][A

>>> training loss:  0.5362, valid loss:  1.9055, valid f1 score:  0.5000



Training:  73%|██████████████████████████████           | 1102/1501 [01:50<02:29,  2.67it/s][A
Training:  74%|██████████████████████████████▏          | 1104/1501 [01:50<01:52,  3.53it/s][A
Training:  74%|██████████████████████████████▏          | 1106/1501 [01:51<01:25,  4.63it/s][A
Training:  74%|██████████████████████████████▎          | 1108/1501 [01:51<01:06,  5.90it/s][A
Training:  74%|██████████████████████████████▎          | 1110/1501 [01:51<00:53,  7.30it/s][A
Training:  74%|██████████████████████████████▎          | 1112/1501 [01:51<00:43,  8.91it/s][A
Training:  74%|██████████████████████████████▍          | 1114/1501 [01:51<00:36, 10.61it/s][A
Training:  74%|██████████████████████████████▍          | 1116/1501 [01:51<00:31, 12.32it/s][A
Training:  74%|██████████████████████████████▌          | 1118/1501 [01:51<00:28, 13.64it/s][A
Training:  75%|██████████████████████████████▌          | 1121/1501 [01:51<00:24, 15.42it/s][A
Training:  75%|████████████████████████

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 40.03it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 39.08it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.98it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.47it/s][A[A

Training:  80%|████████████████████████████████▋        | 1198/1501 [02:00<03:35,  1.41it/s][A
Training:  80%|████████████████████████████████▊        | 1200/1501 [02:00<02:35,  1.93it/s][A

>>> training loss:  0.5533, valid loss:  1.8718, valid f1 score:  0.5041



Training:  80%|████████████████████████████████▊        | 1202/1501 [02:00<01:53,  2.64it/s][A
Training:  80%|████████████████████████████████▉        | 1204/1501 [02:01<01:23,  3.55it/s][A
Training:  80%|████████████████████████████████▉        | 1206/1501 [02:01<01:03,  4.67it/s][A
Training:  80%|████████████████████████████████▉        | 1208/1501 [02:01<00:48,  5.99it/s][A
Training:  81%|█████████████████████████████████        | 1210/1501 [02:01<00:38,  7.52it/s][A
Training:  81%|█████████████████████████████████        | 1212/1501 [02:01<00:31,  9.09it/s][A
Training:  81%|█████████████████████████████████▏       | 1214/1501 [02:01<00:26, 10.78it/s][A
Training:  81%|█████████████████████████████████▏       | 1216/1501 [02:01<00:23, 12.02it/s][A
Training:  81%|█████████████████████████████████▎       | 1218/1501 [02:01<00:21, 13.31it/s][A
Training:  81%|█████████████████████████████████▎       | 1221/1501 [02:02<00:18, 15.47it/s][A
Training:  81%|████████████████████████

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 39.29it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.92it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.85it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.00it/s][A[A

Training:  86%|███████████████████████████████████▍     | 1297/1501 [02:10<02:25,  1.40it/s][A
Training:  87%|███████████████████████████████████▍     | 1299/1501 [02:10<01:44,  1.94it/s][A

>>> training loss:  0.5520, valid loss:  1.9023, valid f1 score:  0.5040



Training:  87%|███████████████████████████████████▌     | 1301/1501 [02:10<01:16,  2.63it/s][A
Training:  87%|███████████████████████████████████▌     | 1303/1501 [02:11<00:55,  3.54it/s][A
Training:  87%|███████████████████████████████████▋     | 1305/1501 [02:11<00:41,  4.68it/s][A
Training:  87%|███████████████████████████████████▋     | 1307/1501 [02:11<00:32,  5.97it/s][A
Training:  87%|███████████████████████████████████▊     | 1309/1501 [02:11<00:25,  7.44it/s][A
Training:  87%|███████████████████████████████████▊     | 1311/1501 [02:11<00:21,  9.02it/s][A
Training:  87%|███████████████████████████████████▊     | 1313/1501 [02:11<00:17, 10.65it/s][A
Training:  88%|███████████████████████████████████▉     | 1315/1501 [02:11<00:15, 11.86it/s][A
Training:  88%|███████████████████████████████████▉     | 1317/1501 [02:11<00:13, 13.26it/s][A
Training:  88%|████████████████████████████████████     | 1319/1501 [02:11<00:12, 14.47it/s][A
Training:  88%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.76it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 39.66it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.09it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.63it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.99it/s][A[A

Training:  93%|██████████████████████████████████████▏  | 1397/1501 [02:20<01:14,  1.39it/s][A
Training:  93%|██████████████████████████████████████▏  | 1399/1501 [02:20<00:52,  1.93it/s][A

>>> training loss:  0.5695, valid loss:  1.9079, valid f1 score:  0.4898



Training:  93%|██████████████████████████████████████▎  | 1401/1501 [02:21<00:37,  2.63it/s][A
Training:  93%|██████████████████████████████████████▎  | 1403/1501 [02:21<00:27,  3.54it/s][A
Training:  94%|██████████████████████████████████████▍  | 1405/1501 [02:21<00:20,  4.67it/s][A
Training:  94%|██████████████████████████████████████▍  | 1407/1501 [02:21<00:15,  5.89it/s][A
Training:  94%|██████████████████████████████████████▍  | 1409/1501 [02:21<00:12,  7.42it/s][A
Training:  94%|██████████████████████████████████████▌  | 1411/1501 [02:21<00:09,  9.03it/s][A
Training:  94%|██████████████████████████████████████▌  | 1413/1501 [02:21<00:08, 10.75it/s][A
Training:  94%|██████████████████████████████████████▋  | 1415/1501 [02:21<00:07, 12.13it/s][A
Training:  94%|██████████████████████████████████████▋  | 1417/1501 [02:21<00:06, 13.27it/s][A
Training:  95%|██████████████████████████████████████▊  | 1419/1501 [02:22<00:05, 14.59it/s][A
Training:  95%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.57it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 39.43it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.24it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.12it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.77it/s][A[A

Training: 100%|████████████████████████████████████████▉| 1497/1501 [02:30<00:02,  1.39it/s][A
Training: 100%|████████████████████████████████████████▉| 1499/1501 [02:31<00:01,  1.92it/s][A

>>> training loss:  0.5685, valid loss:  1.9120, valid f1 score:  0.4987



Training: 100%|█████████████████████████████████████████| 1501/1501 [02:31<00:00,  9.93it/s][A
 50%|████████████████████████████                            | 4/8 [10:30<10:26, 156.74s/it]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:25, 17.44it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:28, 16.95it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:27, 17.16it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:36, 15.48it/s][A
Training:   1%|▎                                          | 11/1501 [00:00<01:26, 17.31it/s][A
Training:   1%|▎                                          | 13/1501 [00:00<01:22, 18.02it/s][A
Training:   1%|▍                                          | 15/1501 [00:00<01:23, 17.77it/s][A
Training:   1%|▍                          

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:03<00:00, 38.50it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 38.77it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 38.51it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 38.69it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.66it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 38.61it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.77it/s][A[A

Training:   6%|██▊                                        | 96/1501 [00:09<16:53,  1.39it/s][A
Training:   7%|██▊                                        | 98/1501 [00:10<12:12,  1.92it/s][A

>>> training loss:  0.3822, valid loss:  1.9430, valid f1 score:  0.4972



Training:   7%|██▊                                       | 100/1501 [00:10<08:55,  2.61it/s][A
Training:   7%|██▊                                       | 102/1501 [00:10<06:40,  3.49it/s][A
Training:   7%|██▉                                       | 104/1501 [00:10<05:01,  4.63it/s][A
Training:   7%|██▉                                       | 106/1501 [00:10<03:54,  5.95it/s][A
Training:   7%|███                                       | 108/1501 [00:10<03:11,  7.29it/s][A
Training:   7%|███                                       | 110/1501 [00:10<02:38,  8.79it/s][A
Training:   7%|███▏                                      | 112/1501 [00:10<02:15, 10.22it/s][A
Training:   8%|███▏                                      | 114/1501 [00:10<01:57, 11.77it/s][A
Training:   8%|███▏                                      | 116/1501 [00:11<01:44, 13.29it/s][A
Training:   8%|███▎                                      | 118/1501 [00:11<01:39, 13.88it/s][A
Training:   8%|███▎                    

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 37.87it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 37.86it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 38.24it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.20it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 37.97it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.75it/s][A[A

Training:  13%|█████▍                                    | 196/1501 [00:20<15:40,  1.39it/s][A
Training:  13%|█████▌                                    | 198/1501 [00:20<11:19,  1.92it/s][A

>>> training loss:  0.3596, valid loss:  1.9263, valid f1 score:  0.5024



Training:  13%|█████▌                                    | 200/1501 [00:20<08:16,  2.62it/s][A
Training:  13%|█████▋                                    | 202/1501 [00:20<06:10,  3.50it/s][A
Training:  14%|█████▋                                    | 204/1501 [00:20<04:39,  4.65it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:20<03:37,  5.96it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:20<02:55,  7.37it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:20<02:23,  9.00it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:21<02:01, 10.59it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:21<01:46, 12.06it/s][A
Training:  14%|██████                                    | 216/1501 [00:21<01:37, 13.14it/s][A
Training:  15%|██████                                    | 218/1501 [00:21<01:28, 14.55it/s][A
Training:  15%|██████▏                 

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 37.42it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 38.76it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 38.02it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 38.42it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 37.37it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.11it/s][A[A

Training:  20%|████████▎                                 | 296/1501 [00:30<14:22,  1.40it/s][A
Training:  20%|████████▎                                 | 298/1501 [00:30<10:23,  1.93it/s][A

>>> training loss:  0.4060, valid loss:  1.9361, valid f1 score:  0.5053



Training:  20%|████████▍                                 | 300/1501 [00:30<07:35,  2.63it/s][A
Training:  20%|████████▍                                 | 302/1501 [00:30<05:38,  3.54it/s][A
Training:  20%|████████▌                                 | 304/1501 [00:30<04:19,  4.61it/s][A
Training:  20%|████████▌                                 | 306/1501 [00:30<03:20,  5.97it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:30<02:38,  7.53it/s][A
Training:  21%|████████▋                                 | 310/1501 [00:31<02:09,  9.17it/s][A
Training:  21%|████████▋                                 | 312/1501 [00:31<01:51, 10.66it/s][A
Training:  21%|████████▊                                 | 314/1501 [00:31<01:39, 11.94it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:31<01:29, 13.23it/s][A
Training:  21%|████████▉                                 | 318/1501 [00:31<01:24, 13.97it/s][A
Training:  21%|████████▉               

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:03<00:00, 37.63it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:03<00:00, 39.07it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 38.48it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.91it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.30it/s][A[A

Training:  26%|███████████                               | 396/1501 [00:40<13:06,  1.41it/s][A
Training:  27%|███████████▏                              | 398/1501 [00:40<09:29,  1.94it/s][A

>>> training loss:  0.3896, valid loss:  1.9547, valid f1 score:  0.4918



Training:  27%|███████████▏                              | 400/1501 [00:40<06:54,  2.66it/s][A
Training:  27%|███████████▏                              | 402/1501 [00:40<05:08,  3.56it/s][A
Training:  27%|███████████▎                              | 404/1501 [00:40<03:54,  4.69it/s][A
Training:  27%|███████████▎                              | 406/1501 [00:40<03:01,  6.05it/s][A
Training:  27%|███████████▍                              | 408/1501 [00:40<02:25,  7.49it/s][A
Training:  27%|███████████▍                              | 410/1501 [00:41<02:00,  9.04it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:41<01:41, 10.69it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:41<01:28, 12.25it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:41<01:19, 13.67it/s][A
Training:  28%|███████████▋                              | 418/1501 [00:41<01:12, 14.87it/s][A
Training:  28%|███████████▊            

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.24it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:03<00:00, 38.54it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 37.97it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.13it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.25it/s][A[A

Training:  33%|█████████████▉                            | 496/1501 [00:50<11:57,  1.40it/s][A
Training:  33%|█████████████▉                            | 498/1501 [00:50<08:36,  1.94it/s][A

>>> training loss:  0.3986, valid loss:  1.9995, valid f1 score:  0.4981



Training:  33%|█████████████▉                            | 500/1501 [00:50<06:20,  2.63it/s][A
Training:  33%|██████████████                            | 502/1501 [00:50<04:43,  3.52it/s][A
Training:  34%|██████████████                            | 504/1501 [00:50<03:33,  4.67it/s][A
Training:  34%|██████████████▏                           | 506/1501 [00:50<02:45,  6.01it/s][A
Training:  34%|██████████████▏                           | 508/1501 [00:51<02:11,  7.58it/s][A
Training:  34%|██████████████▎                           | 510/1501 [00:51<01:46,  9.26it/s][A
Training:  34%|██████████████▎                           | 512/1501 [00:51<01:34, 10.47it/s][A
Training:  34%|██████████████▍                           | 514/1501 [00:51<01:20, 12.22it/s][A
Training:  34%|██████████████▍                           | 516/1501 [00:51<01:15, 13.03it/s][A
Training:  35%|██████████████▍                           | 518/1501 [00:51<01:10, 14.00it/s][A
Training:  35%|██████████████▌         

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 38.10it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 39.86it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 38.76it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.60it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 38.58it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.20it/s][A[A

Training:  40%|████████████████▋                         | 596/1501 [01:00<10:46,  1.40it/s][A
Training:  40%|████████████████▋                         | 598/1501 [01:00<07:46,  1.93it/s][A

>>> training loss:  0.3869, valid loss:  1.9987, valid f1 score:  0.4827



Training:  40%|████████████████▊                         | 600/1501 [01:00<05:40,  2.64it/s][A
Training:  40%|████████████████▊                         | 602/1501 [01:00<04:12,  3.55it/s][A
Training:  40%|████████████████▉                         | 604/1501 [01:00<03:11,  4.68it/s][A
Training:  40%|████████████████▉                         | 606/1501 [01:01<02:32,  5.88it/s][A
Training:  41%|█████████████████                         | 608/1501 [01:01<02:02,  7.30it/s][A
Training:  41%|█████████████████                         | 610/1501 [01:01<01:40,  8.88it/s][A
Training:  41%|█████████████████                         | 612/1501 [01:01<01:24, 10.48it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [01:01<01:15, 11.70it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [01:01<01:07, 13.12it/s][A
Training:  41%|█████████████████▎                        | 618/1501 [01:01<01:01, 14.30it/s][A
Training:  41%|█████████████████▍      

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 39.09it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 38.50it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.69it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.01it/s][A[A

Training:  46%|███████████████████▍                      | 696/1501 [01:10<09:37,  1.39it/s][A
Training:  47%|███████████████████▌                      | 698/1501 [01:10<06:56,  1.93it/s][A

>>> training loss:  0.4362, valid loss:  1.9879, valid f1 score:  0.4865



Training:  47%|███████████████████▌                      | 700/1501 [01:10<05:03,  2.64it/s][A
Training:  47%|███████████████████▋                      | 702/1501 [01:10<03:46,  3.53it/s][A
Training:  47%|███████████████████▋                      | 704/1501 [01:11<02:52,  4.62it/s][A
Training:  47%|███████████████████▊                      | 706/1501 [01:11<02:13,  5.96it/s][A
Training:  47%|███████████████████▊                      | 708/1501 [01:11<01:46,  7.47it/s][A
Training:  47%|███████████████████▊                      | 710/1501 [01:11<01:29,  8.80it/s][A
Training:  47%|███████████████████▉                      | 712/1501 [01:11<01:14, 10.52it/s][A
Training:  48%|███████████████████▉                      | 714/1501 [01:11<01:06, 11.88it/s][A
Training:  48%|████████████████████                      | 716/1501 [01:11<00:59, 13.26it/s][A
Training:  48%|████████████████████                      | 718/1501 [01:11<00:54, 14.26it/s][A
Training:  48%|████████████████████▏   

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.60it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.70it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.84it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.88it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.21it/s][A[A

Training:  53%|██████████████████████▎                   | 796/1501 [01:20<08:24,  1.40it/s][A
Training:  53%|██████████████████████▎                   | 798/1501 [01:20<06:03,  1.93it/s][A

>>> training loss:  0.4343, valid loss:  1.9814, valid f1 score:  0.5005



Training:  53%|██████████████████████▍                   | 800/1501 [01:21<04:26,  2.63it/s][A
Training:  53%|██████████████████████▍                   | 802/1501 [01:21<03:18,  3.52it/s][A
Training:  54%|██████████████████████▍                   | 804/1501 [01:21<02:29,  4.66it/s][A
Training:  54%|██████████████████████▌                   | 806/1501 [01:21<01:58,  5.88it/s][A
Training:  54%|██████████████████████▌                   | 808/1501 [01:21<01:33,  7.40it/s][A
Training:  54%|██████████████████████▋                   | 810/1501 [01:21<01:16,  9.00it/s][A
Training:  54%|██████████████████████▋                   | 812/1501 [01:21<01:06, 10.33it/s][A
Training:  54%|██████████████████████▊                   | 814/1501 [01:21<00:58, 11.82it/s][A
Training:  54%|██████████████████████▊                   | 816/1501 [01:21<00:52, 13.16it/s][A
Training:  54%|██████████████████████▉                   | 818/1501 [01:22<00:47, 14.40it/s][A
Training:  55%|██████████████████████▉ 

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.25it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.36it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.70it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.24it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.14it/s][A[A

Training:  60%|█████████████████████████                 | 897/1501 [01:30<07:14,  1.39it/s][A
Training:  60%|█████████████████████████▏                | 899/1501 [01:31<05:13,  1.92it/s][A

>>> training loss:  0.4810, valid loss:  1.9654, valid f1 score:  0.5071



Training:  60%|█████████████████████████▏                | 901/1501 [01:31<03:51,  2.59it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:31<02:50,  3.50it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:31<02:09,  4.61it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:31<01:40,  5.90it/s][A
Training:  61%|█████████████████████████▍                | 910/1501 [01:31<01:12,  8.10it/s][A
Training:  61%|█████████████████████████▌                | 912/1501 [01:31<01:03,  9.27it/s][A
Training:  61%|█████████████████████████▌                | 914/1501 [01:31<00:55, 10.54it/s][A
Training:  61%|█████████████████████████▋                | 916/1501 [01:32<00:49, 11.86it/s][A
Training:  61%|█████████████████████████▋                | 918/1501 [01:32<00:45, 12.94it/s][A
Training:  61%|█████████████████████████▋                | 920/1501 [01:32<00:41, 14.04it/s][A
Training:  61%|████████████████████████

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.42it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.79it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.80it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.07it/s][A[A

Training:  66%|███████████████████████████▊              | 996/1501 [01:41<06:01,  1.40it/s][A
Training:  66%|███████████████████████████▉              | 998/1501 [01:41<04:21,  1.92it/s][A

>>> training loss:  0.4844, valid loss:  1.9776, valid f1 score:  0.5061



Training:  67%|███████████████████████████▎             | 1000/1501 [01:41<03:11,  2.62it/s][A
Training:  67%|███████████████████████████▎             | 1002/1501 [01:41<02:22,  3.50it/s][A
Training:  67%|███████████████████████████▍             | 1004/1501 [01:41<01:48,  4.60it/s][A
Training:  67%|███████████████████████████▍             | 1006/1501 [01:41<01:24,  5.83it/s][A
Training:  67%|███████████████████████████▌             | 1008/1501 [01:41<01:07,  7.29it/s][A
Training:  67%|███████████████████████████▌             | 1010/1501 [01:41<00:55,  8.86it/s][A
Training:  67%|███████████████████████████▋             | 1012/1501 [01:42<00:47, 10.24it/s][A
Training:  68%|███████████████████████████▋             | 1014/1501 [01:42<00:42, 11.51it/s][A
Training:  68%|███████████████████████████▊             | 1016/1501 [01:42<00:37, 12.95it/s][A
Training:  68%|███████████████████████████▊             | 1018/1501 [01:42<00:34, 14.19it/s][A
Training:  68%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.73it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.78it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.03it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.98it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.36it/s][A[A

Training:  73%|█████████████████████████████▉           | 1096/1501 [01:51<04:47,  1.41it/s][A
Training:  73%|█████████████████████████████▉           | 1098/1501 [01:51<03:27,  1.94it/s][A

>>> training loss:  0.5033, valid loss:  1.9987, valid f1 score:  0.4932



Training:  73%|██████████████████████████████           | 1100/1501 [01:51<02:31,  2.65it/s][A
Training:  73%|██████████████████████████████           | 1102/1501 [01:51<01:52,  3.53it/s][A
Training:  74%|██████████████████████████████▏          | 1104/1501 [01:51<01:25,  4.62it/s][A
Training:  74%|██████████████████████████████▏          | 1106/1501 [01:51<01:07,  5.88it/s][A
Training:  74%|██████████████████████████████▎          | 1108/1501 [01:51<00:53,  7.36it/s][A
Training:  74%|██████████████████████████████▎          | 1110/1501 [01:51<00:44,  8.89it/s][A
Training:  74%|██████████████████████████████▎          | 1112/1501 [01:52<00:36, 10.54it/s][A
Training:  74%|██████████████████████████████▍          | 1114/1501 [01:52<00:32, 12.03it/s][A
Training:  74%|██████████████████████████████▍          | 1116/1501 [01:52<00:28, 13.34it/s][A
Training:  74%|██████████████████████████████▌          | 1118/1501 [01:52<00:27, 14.18it/s][A
Training:  75%|████████████████████████

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:03<00:00, 39.26it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 38.44it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.72it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.16it/s][A[A

Training:  80%|████████████████████████████████▋        | 1196/1501 [02:01<03:38,  1.40it/s][A
Training:  80%|████████████████████████████████▋        | 1198/1501 [02:01<02:37,  1.93it/s][A

>>> training loss:  0.4995, valid loss:  2.0109, valid f1 score:  0.4990



Training:  80%|████████████████████████████████▊        | 1200/1501 [02:01<01:54,  2.63it/s][A
Training:  80%|████████████████████████████████▊        | 1202/1501 [02:01<01:25,  3.50it/s][A
Training:  80%|████████████████████████████████▉        | 1204/1501 [02:01<01:04,  4.61it/s][A
Training:  80%|████████████████████████████████▉        | 1206/1501 [02:01<00:49,  5.96it/s][A
Training:  80%|████████████████████████████████▉        | 1208/1501 [02:01<00:39,  7.51it/s][A
Training:  81%|█████████████████████████████████        | 1210/1501 [02:02<00:37,  7.80it/s][A
Training:  81%|█████████████████████████████████        | 1212/1501 [02:02<00:30,  9.42it/s][A
Training:  81%|█████████████████████████████████▏       | 1214/1501 [02:02<00:26, 10.78it/s][A
Training:  81%|█████████████████████████████████▏       | 1216/1501 [02:02<00:23, 12.33it/s][A
Training:  81%|█████████████████████████████████▎       | 1218/1501 [02:02<00:20, 13.54it/s][A
Training:  81%|████████████████████████

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 38.22it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 37.67it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 38.22it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 37.87it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.54it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.19it/s][A[A

Training:  86%|███████████████████████████████████▍     | 1296/1501 [02:11<02:30,  1.37it/s][A
Training:  86%|███████████████████████████████████▍     | 1298/1501 [02:11<01:47,  1.89it/s][A

>>> training loss:  0.5086, valid loss:  2.0039, valid f1 score:  0.4826



Training:  87%|███████████████████████████████████▌     | 1300/1501 [02:11<01:17,  2.59it/s][A
Training:  87%|███████████████████████████████████▌     | 1302/1501 [02:11<00:57,  3.46it/s][A
Training:  87%|███████████████████████████████████▌     | 1304/1501 [02:12<00:42,  4.58it/s][A
Training:  87%|███████████████████████████████████▋     | 1306/1501 [02:12<00:33,  5.90it/s][A
Training:  87%|███████████████████████████████████▋     | 1308/1501 [02:12<00:26,  7.37it/s][A
Training:  87%|███████████████████████████████████▊     | 1310/1501 [02:12<00:21,  9.01it/s][A
Training:  87%|███████████████████████████████████▊     | 1312/1501 [02:12<00:18, 10.43it/s][A
Training:  88%|███████████████████████████████████▉     | 1314/1501 [02:12<00:15, 12.00it/s][A
Training:  88%|███████████████████████████████████▉     | 1316/1501 [02:12<00:13, 13.33it/s][A
Training:  88%|████████████████████████████████████     | 1318/1501 [02:12<00:12, 14.25it/s][A
Training:  88%|████████████████████████

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 38.66it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 38.74it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 39.01it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.73it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 38.63it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.98it/s][A[A

Training:  93%|██████████████████████████████████████▏  | 1396/1501 [02:21<01:15,  1.39it/s][A
Training:  93%|██████████████████████████████████████▏  | 1398/1501 [02:21<00:53,  1.93it/s][A

>>> training loss:  0.5153, valid loss:  2.0139, valid f1 score:  0.4916



Training:  93%|██████████████████████████████████████▏  | 1400/1501 [02:21<00:38,  2.63it/s][A
Training:  93%|██████████████████████████████████████▎  | 1402/1501 [02:22<00:27,  3.54it/s][A
Training:  94%|██████████████████████████████████████▎  | 1404/1501 [02:22<00:20,  4.65it/s][A
Training:  94%|██████████████████████████████████████▍  | 1406/1501 [02:22<00:15,  5.98it/s][A
Training:  94%|██████████████████████████████████████▍  | 1408/1501 [02:22<00:12,  7.44it/s][A
Training:  94%|██████████████████████████████████████▌  | 1410/1501 [02:22<00:10,  8.97it/s][A
Training:  94%|██████████████████████████████████████▌  | 1412/1501 [02:22<00:08, 10.25it/s][A
Training:  94%|██████████████████████████████████████▌  | 1414/1501 [02:22<00:07, 11.42it/s][A
Training:  94%|██████████████████████████████████████▋  | 1416/1501 [02:22<00:06, 12.92it/s][A
Training:  94%|██████████████████████████████████████▋  | 1418/1501 [02:22<00:06, 13.80it/s][A
Training:  95%|████████████████████████

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 39.18it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.99it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.16it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.66it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.38it/s][A[A

Training: 100%|████████████████████████████████████████▊| 1496/1501 [02:31<00:03,  1.39it/s][A
Training: 100%|████████████████████████████████████████▉| 1498/1501 [02:31<00:01,  1.91it/s][A

>>> training loss:  0.5185, valid loss:  1.9787, valid f1 score:  0.4892



Training: 100%|█████████████████████████████████████████| 1501/1501 [02:32<00:00,  9.87it/s][A
 62%|███████████████████████████████████                     | 5/8 [13:02<07:45, 155.08s/it]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:23, 17.89it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:24, 17.73it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:24, 17.75it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:30, 16.53it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:30, 16.52it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:26, 17.25it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:25, 17.29it/s][A
Training:   1%|▍                          

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 38.08it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 37.50it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 38.64it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.28it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.12it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.08it/s][A[A

Training:   6%|██▋                                        | 95/1501 [00:09<16:50,  1.39it/s][A
Training:   6%|██▊                                        | 97/1501 [00:09<12:10,  1.92it/s][A

>>> training loss:  0.3676, valid loss:  2.0234, valid f1 score:  0.4828



Training:   7%|██▊                                        | 99/1501 [00:10<08:52,  2.63it/s][A
Training:   7%|██▊                                       | 101/1501 [00:10<06:38,  3.51it/s][A
Training:   7%|██▉                                       | 103/1501 [00:10<05:00,  4.66it/s][A
Training:   7%|██▉                                       | 105/1501 [00:10<03:52,  6.00it/s][A
Training:   7%|██▉                                       | 107/1501 [00:10<03:07,  7.45it/s][A
Training:   7%|███                                       | 109/1501 [00:10<02:33,  9.05it/s][A
Training:   7%|███                                       | 111/1501 [00:10<02:09, 10.72it/s][A
Training:   8%|███▏                                      | 113/1501 [00:10<01:54, 12.16it/s][A
Training:   8%|███▏                                      | 115/1501 [00:10<01:43, 13.42it/s][A
Training:   8%|███▎                                      | 117/1501 [00:11<01:37, 14.18it/s][A
Training:   8%|███▎                    

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.75it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.74it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.06it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.02it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.13it/s][A[A

Training:  13%|█████▍                                    | 196/1501 [00:20<15:34,  1.40it/s][A
Training:  13%|█████▌                                    | 198/1501 [00:20<11:15,  1.93it/s][A

>>> training loss:  0.3331, valid loss:  2.0201, valid f1 score:  0.5016



Training:  13%|█████▌                                    | 200/1501 [00:20<08:14,  2.63it/s][A
Training:  13%|█████▋                                    | 202/1501 [00:20<06:07,  3.53it/s][A
Training:  14%|█████▋                                    | 204/1501 [00:20<04:39,  4.64it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:20<03:38,  5.92it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:20<02:57,  7.29it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:20<02:27,  8.76it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:20<02:05, 10.30it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:21<01:48, 11.91it/s][A
Training:  14%|██████                                    | 216/1501 [00:21<01:36, 13.29it/s][A
Training:  15%|██████                                    | 218/1501 [00:21<01:27, 14.58it/s][A
Training:  15%|██████▏                 

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.86it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.32it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.78it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.86it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.31it/s][A[A

Training:  20%|████████▎                                 | 296/1501 [00:30<14:18,  1.40it/s][A
Training:  20%|████████▎                                 | 298/1501 [00:30<10:20,  1.94it/s][A

>>> training loss:  0.3226, valid loss:  2.0367, valid f1 score:  0.4976



Training:  20%|████████▍                                 | 300/1501 [00:30<07:35,  2.64it/s][A
Training:  20%|████████▍                                 | 302/1501 [00:30<05:36,  3.56it/s][A
Training:  20%|████████▌                                 | 304/1501 [00:30<04:16,  4.67it/s][A
Training:  20%|████████▌                                 | 306/1501 [00:30<03:19,  6.00it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:30<02:38,  7.53it/s][A
Training:  21%|████████▋                                 | 310/1501 [00:30<02:09,  9.17it/s][A
Training:  21%|████████▋                                 | 312/1501 [00:31<01:52, 10.61it/s][A
Training:  21%|████████▊                                 | 314/1501 [00:31<01:40, 11.81it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:31<01:31, 12.97it/s][A
Training:  21%|████████▉                                 | 318/1501 [00:31<01:22, 14.39it/s][A
Training:  21%|████████▉               

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 38.67it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 38.54it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 38.88it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.23it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.29it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.67it/s][A[A

Training:  26%|███████████                               | 396/1501 [00:40<13:20,  1.38it/s][A
Training:  27%|███████████▏                              | 398/1501 [00:40<09:36,  1.91it/s][A

>>> training loss:  0.3877, valid loss:  2.0523, valid f1 score:  0.5092



Training:  27%|███████████▏                              | 400/1501 [00:40<07:01,  2.61it/s][A
Training:  27%|███████████▏                              | 402/1501 [00:40<05:12,  3.52it/s][A
Training:  27%|███████████▎                              | 404/1501 [00:40<03:58,  4.61it/s][A
Training:  27%|███████████▎                              | 406/1501 [00:40<03:06,  5.89it/s][A
Training:  27%|███████████▍                              | 408/1501 [00:40<02:27,  7.41it/s][A
Training:  27%|███████████▍                              | 410/1501 [00:41<02:03,  8.84it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:41<01:46, 10.26it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:41<01:31, 11.93it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:41<01:20, 13.51it/s][A
Training:  28%|███████████▋                              | 418/1501 [00:41<01:16, 14.15it/s][A
Training:  28%|███████████▊            

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:03<00:00, 37.26it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:03<00:00, 38.04it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 37.68it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.31it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.16it/s][A[A

Training:  33%|█████████████▉                            | 496/1501 [00:50<11:58,  1.40it/s][A
Training:  33%|█████████████▉                            | 498/1501 [00:50<08:38,  1.93it/s][A

>>> training loss:  0.3719, valid loss:  2.0404, valid f1 score:  0.4911



Training:  33%|█████████████▉                            | 500/1501 [00:50<06:22,  2.62it/s][A
Training:  34%|██████████████                            | 503/1501 [00:50<04:11,  3.96it/s][A
Training:  34%|██████████████▏                           | 505/1501 [00:50<03:19,  5.00it/s][A
Training:  34%|██████████████▏                           | 507/1501 [00:51<02:37,  6.30it/s][A
Training:  34%|██████████████▏                           | 509/1501 [00:51<02:08,  7.70it/s][A
Training:  34%|██████████████▎                           | 511/1501 [00:51<01:46,  9.30it/s][A
Training:  34%|██████████████▎                           | 513/1501 [00:51<01:33, 10.54it/s][A
Training:  34%|██████████████▍                           | 515/1501 [00:51<01:22, 11.93it/s][A
Training:  34%|██████████████▍                           | 517/1501 [00:51<01:15, 13.09it/s][A
Training:  35%|██████████████▌                           | 519/1501 [00:51<01:07, 14.50it/s][A
Training:  35%|██████████████▌         

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 38.38it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 37.07it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.79it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.77it/s][A[A

Training:  40%|████████████████▋                         | 595/1501 [01:00<11:09,  1.35it/s][A
Training:  40%|████████████████▋                         | 597/1501 [01:00<08:04,  1.87it/s][A

>>> training loss:  0.3713, valid loss:  2.0949, valid f1 score:  0.4798



Training:  40%|████████████████▊                         | 599/1501 [01:00<05:56,  2.53it/s][A
Training:  40%|████████████████▊                         | 601/1501 [01:01<04:23,  3.41it/s][A
Training:  40%|████████████████▊                         | 603/1501 [01:01<03:18,  4.52it/s][A
Training:  40%|████████████████▉                         | 605/1501 [01:01<02:34,  5.81it/s][A
Training:  40%|████████████████▉                         | 607/1501 [01:01<02:02,  7.32it/s][A
Training:  41%|█████████████████                         | 609/1501 [01:01<01:41,  8.77it/s][A
Training:  41%|█████████████████                         | 611/1501 [01:01<01:27, 10.12it/s][A
Training:  41%|█████████████████▏                        | 613/1501 [01:01<01:14, 11.87it/s][A
Training:  41%|█████████████████▏                        | 615/1501 [01:01<01:07, 13.14it/s][A
Training:  41%|█████████████████▎                        | 617/1501 [01:01<01:02, 14.20it/s][A
Training:  41%|█████████████████▎      

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.89it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.26it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.22it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.77it/s][A[A

Training:  46%|███████████████████▍                      | 695/1501 [01:10<09:28,  1.42it/s][A
Training:  46%|███████████████████▌                      | 697/1501 [01:10<06:51,  1.96it/s][A

>>> training loss:  0.4224, valid loss:  2.0329, valid f1 score:  0.4919



Training:  47%|███████████████████▌                      | 699/1501 [01:10<05:01,  2.66it/s][A
Training:  47%|███████████████████▌                      | 701/1501 [01:11<03:43,  3.57it/s][A
Training:  47%|███████████████████▋                      | 703/1501 [01:11<02:48,  4.73it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [01:11<02:10,  6.09it/s][A
Training:  47%|███████████████████▊                      | 707/1501 [01:11<01:44,  7.61it/s][A
Training:  47%|███████████████████▊                      | 709/1501 [01:11<01:25,  9.23it/s][A
Training:  47%|███████████████████▉                      | 711/1501 [01:11<01:12, 10.95it/s][A
Training:  48%|███████████████████▉                      | 713/1501 [01:11<01:03, 12.32it/s][A
Training:  48%|████████████████████                      | 715/1501 [01:11<00:58, 13.47it/s][A
Training:  48%|████████████████████                      | 717/1501 [01:11<00:54, 14.43it/s][A
Training:  48%|████████████████████    

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.25it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.46it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 38.86it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 38.91it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.40it/s][A[A

Training:  53%|██████████████████████▏                   | 795/1501 [01:20<08:22,  1.41it/s][A
Training:  53%|██████████████████████▎                   | 797/1501 [01:20<06:01,  1.95it/s][A

>>> training loss:  0.4131, valid loss:  2.0633, valid f1 score:  0.4929



Training:  53%|██████████████████████▎                   | 799/1501 [01:20<04:25,  2.64it/s][A
Training:  53%|██████████████████████▍                   | 801/1501 [01:21<03:16,  3.56it/s][A
Training:  53%|██████████████████████▍                   | 803/1501 [01:21<02:30,  4.65it/s][A
Training:  54%|██████████████████████▌                   | 805/1501 [01:21<01:56,  5.96it/s][A
Training:  54%|██████████████████████▌                   | 807/1501 [01:21<01:33,  7.42it/s][A
Training:  54%|██████████████████████▋                   | 809/1501 [01:21<01:19,  8.68it/s][A
Training:  54%|██████████████████████▋                   | 811/1501 [01:21<01:07, 10.29it/s][A
Training:  54%|██████████████████████▋                   | 813/1501 [01:21<00:58, 11.74it/s][A
Training:  54%|██████████████████████▊                   | 815/1501 [01:21<00:52, 12.96it/s][A
Training:  54%|██████████████████████▊                   | 817/1501 [01:21<00:48, 14.12it/s][A
Training:  55%|██████████████████████▉ 

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 38.86it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:03<00:00, 39.31it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 40.08it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.57it/s][A[A

Training:  60%|█████████████████████████                 | 895/1501 [01:30<07:08,  1.42it/s][A
Training:  60%|█████████████████████████                 | 897/1501 [01:30<05:09,  1.95it/s][A

>>> training loss:  0.4220, valid loss:  2.0586, valid f1 score:  0.4899



Training:  60%|█████████████████████████▏                | 899/1501 [01:30<03:46,  2.66it/s][A
Training:  60%|█████████████████████████▏                | 901/1501 [01:31<02:48,  3.55it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:31<02:08,  4.64it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:31<01:39,  5.98it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:31<01:18,  7.52it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:31<01:06,  8.89it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:31<00:59,  9.88it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:31<00:53, 10.94it/s][A
Training:  61%|█████████████████████████▌                | 915/1501 [01:31<00:47, 12.31it/s][A
Training:  61%|█████████████████████████▋                | 917/1501 [01:32<00:42, 13.75it/s][A
Training:  61%|████████████████████████

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 38.19it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 40.00it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 39.02it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 40.06it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.25it/s][A[A

Training:  66%|███████████████████████████▊              | 995/1501 [01:40<05:59,  1.41it/s][A
Training:  66%|███████████████████████████▉              | 997/1501 [01:40<04:19,  1.94it/s][A

>>> training loss:  0.4205, valid loss:  2.0798, valid f1 score:  0.4858



Training:  67%|███████████████████████████▉              | 999/1501 [01:41<03:10,  2.63it/s][A
Training:  67%|███████████████████████████▎             | 1001/1501 [01:41<02:21,  3.53it/s][A
Training:  67%|███████████████████████████▍             | 1003/1501 [01:41<01:47,  4.64it/s][A
Training:  67%|███████████████████████████▍             | 1005/1501 [01:41<01:23,  5.93it/s][A
Training:  67%|███████████████████████████▌             | 1007/1501 [01:41<01:06,  7.43it/s][A
Training:  67%|███████████████████████████▌             | 1009/1501 [01:41<00:54,  8.99it/s][A
Training:  67%|███████████████████████████▌             | 1011/1501 [01:41<00:46, 10.48it/s][A
Training:  67%|███████████████████████████▋             | 1013/1501 [01:41<00:40, 12.13it/s][A
Training:  68%|███████████████████████████▋             | 1015/1501 [01:42<00:36, 13.25it/s][A
Training:  68%|███████████████████████████▊             | 1017/1501 [01:42<00:35, 13.80it/s][A
Training:  68%|████████████████████████

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 38.22it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 40.07it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 39.15it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.44it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.39it/s][A[A

Training:  73%|█████████████████████████████▉           | 1095/1501 [01:51<04:50,  1.40it/s][A
Training:  73%|█████████████████████████████▉           | 1097/1501 [01:51<03:29,  1.93it/s][A

>>> training loss:  0.4299, valid loss:  2.0664, valid f1 score:  0.4999



Training:  73%|██████████████████████████████           | 1099/1501 [01:51<02:32,  2.64it/s][A
Training:  73%|██████████████████████████████           | 1101/1501 [01:51<01:53,  3.51it/s][A
Training:  73%|██████████████████████████████▏          | 1103/1501 [01:51<01:26,  4.62it/s][A
Training:  74%|██████████████████████████████▏          | 1105/1501 [01:51<01:06,  5.94it/s][A
Training:  74%|██████████████████████████████▏          | 1107/1501 [01:51<00:53,  7.42it/s][A
Training:  74%|██████████████████████████████▎          | 1109/1501 [01:51<00:43,  9.09it/s][A
Training:  74%|██████████████████████████████▎          | 1111/1501 [01:52<00:37, 10.34it/s][A
Training:  74%|██████████████████████████████▍          | 1113/1501 [01:52<00:32, 11.88it/s][A
Training:  74%|██████████████████████████████▍          | 1115/1501 [01:52<00:29, 13.25it/s][A
Training:  74%|██████████████████████████████▌          | 1117/1501 [01:52<00:26, 14.28it/s][A
Training:  75%|████████████████████████

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 40.54it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 39.68it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.73it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.42it/s][A[A

Training:  80%|████████████████████████████████▋        | 1195/1501 [02:01<03:37,  1.41it/s][A
Training:  80%|████████████████████████████████▋        | 1197/1501 [02:01<02:36,  1.95it/s][A

>>> training loss:  0.4547, valid loss:  2.0634, valid f1 score:  0.4963



Training:  80%|████████████████████████████████▊        | 1199/1501 [02:01<01:54,  2.63it/s][A
Training:  80%|████████████████████████████████▊        | 1201/1501 [02:01<01:25,  3.52it/s][A
Training:  80%|████████████████████████████████▊        | 1203/1501 [02:01<01:04,  4.65it/s][A
Training:  80%|████████████████████████████████▉        | 1205/1501 [02:01<00:49,  6.02it/s][A
Training:  80%|████████████████████████████████▉        | 1207/1501 [02:01<00:39,  7.52it/s][A
Training:  81%|█████████████████████████████████        | 1210/1501 [02:01<00:29,  9.97it/s][A
Training:  81%|█████████████████████████████████        | 1212/1501 [02:02<00:25, 11.48it/s][A
Training:  81%|█████████████████████████████████▏       | 1214/1501 [02:02<00:22, 12.61it/s][A
Training:  81%|█████████████████████████████████▏       | 1216/1501 [02:02<00:21, 13.46it/s][A
Training:  81%|█████████████████████████████████▎       | 1218/1501 [02:02<00:19, 14.68it/s][A
Training:  81%|████████████████████████

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 40.22it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 40.10it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 39.21it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.29it/s][A[A

Training:  86%|███████████████████████████████████▍     | 1296/1501 [02:11<02:28,  1.38it/s][A
Training:  86%|███████████████████████████████████▍     | 1298/1501 [02:11<01:46,  1.91it/s][A

>>> training loss:  0.4534, valid loss:  2.0848, valid f1 score:  0.4961



Training:  87%|███████████████████████████████████▌     | 1300/1501 [02:11<01:17,  2.60it/s][A
Training:  87%|███████████████████████████████████▌     | 1302/1501 [02:11<00:57,  3.46it/s][A
Training:  87%|███████████████████████████████████▌     | 1304/1501 [02:11<00:43,  4.57it/s][A
Training:  87%|███████████████████████████████████▋     | 1306/1501 [02:11<00:33,  5.78it/s][A
Training:  87%|███████████████████████████████████▋     | 1308/1501 [02:12<00:27,  7.13it/s][A
Training:  87%|███████████████████████████████████▊     | 1310/1501 [02:12<00:21,  8.75it/s][A
Training:  87%|███████████████████████████████████▊     | 1312/1501 [02:12<00:18, 10.21it/s][A
Training:  88%|███████████████████████████████████▉     | 1314/1501 [02:12<00:16, 11.67it/s][A
Training:  88%|███████████████████████████████████▉     | 1316/1501 [02:12<00:14, 12.98it/s][A
Training:  88%|████████████████████████████████████     | 1318/1501 [02:12<00:12, 14.10it/s][A
Training:  88%|████████████████████████

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:03<00:00, 39.98it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 39.35it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.26it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.69it/s][A[A

Training:  93%|██████████████████████████████████████   | 1395/1501 [02:21<01:14,  1.41it/s][A
Training:  93%|██████████████████████████████████████▏  | 1397/1501 [02:21<00:53,  1.95it/s][A

>>> training loss:  0.4852, valid loss:  2.1027, valid f1 score:  0.4925



Training:  93%|██████████████████████████████████████▏  | 1399/1501 [02:21<00:38,  2.66it/s][A
Training:  93%|██████████████████████████████████████▎  | 1401/1501 [02:21<00:28,  3.55it/s][A
Training:  93%|██████████████████████████████████████▎  | 1403/1501 [02:21<00:20,  4.67it/s][A
Training:  94%|██████████████████████████████████████▍  | 1405/1501 [02:21<00:15,  6.00it/s][A
Training:  94%|██████████████████████████████████████▍  | 1407/1501 [02:21<00:12,  7.50it/s][A
Training:  94%|██████████████████████████████████████▍  | 1409/1501 [02:22<00:09,  9.21it/s][A
Training:  94%|██████████████████████████████████████▌  | 1411/1501 [02:22<00:08, 10.47it/s][A
Training:  94%|██████████████████████████████████████▌  | 1413/1501 [02:22<00:07, 11.84it/s][A
Training:  94%|██████████████████████████████████████▋  | 1415/1501 [02:22<00:06, 13.07it/s][A
Training:  94%|██████████████████████████████████████▋  | 1417/1501 [02:22<00:05, 14.24it/s][A
Training:  95%|████████████████████████

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:03<00:00, 38.47it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 40.15it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 39.46it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 39.71it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.37it/s][A[A

Training: 100%|████████████████████████████████████████▊| 1495/1501 [02:31<00:04,  1.40it/s][A
Training: 100%|████████████████████████████████████████▉| 1497/1501 [02:31<00:02,  1.95it/s][A

>>> training loss:  0.4861, valid loss:  2.0618, valid f1 score:  0.4933



Training: 100%|████████████████████████████████████████▉| 1499/1501 [02:31<00:00,  2.65it/s][A
Training: 100%|█████████████████████████████████████████| 1501/1501 [02:31<00:00,  9.90it/s][A
 75%|██████████████████████████████████████████              | 6/8 [15:33<05:07, 153.90s/it]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:38, 15.26it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:35, 15.71it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:30, 16.57it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:26, 17.35it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:22, 18.16it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:22, 18.02it/s][A
Training:   1%|▍                          

Evaluation...:  81%|██████████████████████████████▉       | 136/167 [00:03<00:00, 38.29it/s][A[A

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:03<00:00, 38.63it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 38.64it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 38.38it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 38.84it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 39.87it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 38.47it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.90it/s][A[A

Training:   6%|██▋                                        | 94/1501 [00:09<16:52,  1.39it/s][A
Training:   6%|██▊                                        | 96/1501 [00:09<12:09,  1.92it/s][A

>>> training loss:  0.3102, valid loss:  2.0922, valid f1 score:  0.4948



Training:   7%|██▊                                        | 98/1501 [00:10<08:54,  2.63it/s][A
Training:   7%|██▊                                       | 100/1501 [00:10<06:38,  3.51it/s][A
Training:   7%|██▊                                       | 102/1501 [00:10<05:03,  4.62it/s][A
Training:   7%|██▉                                       | 104/1501 [00:10<03:54,  5.96it/s][A
Training:   7%|██▉                                       | 106/1501 [00:10<03:04,  7.54it/s][A
Training:   7%|███                                       | 108/1501 [00:10<02:33,  9.08it/s][A
Training:   7%|███                                       | 110/1501 [00:10<02:10, 10.63it/s][A
Training:   7%|███▏                                      | 112/1501 [00:10<01:56, 11.91it/s][A
Training:   8%|███▏                                      | 114/1501 [00:10<01:45, 13.11it/s][A
Training:   8%|███▏                                      | 116/1501 [00:11<01:37, 14.23it/s][A
Training:   8%|███▎                    

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:03<00:00, 39.03it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 37.77it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 39.10it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 38.58it/s][A[A

Training:  13%|█████▍                                    | 194/1501 [00:19<15:26,  1.41it/s][A
Training:  13%|█████▍                                    | 196/1501 [00:19<11:11,  1.94it/s][A

>>> training loss:  0.3002, valid loss:  2.0915, valid f1 score:  0.5047



Training:  13%|█████▌                                    | 198/1501 [00:20<08:13,  2.64it/s][A
Training:  13%|█████▌                                    | 200/1501 [00:20<06:06,  3.55it/s][A
Training:  13%|█████▋                                    | 202/1501 [00:20<04:36,  4.69it/s][A
Training:  14%|█████▋                                    | 204/1501 [00:20<03:38,  5.93it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:20<02:56,  7.35it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:20<02:23,  9.00it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:20<02:03, 10.45it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:20<01:49, 11.74it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:21<01:42, 12.60it/s][A
Training:  14%|██████                                    | 216/1501 [00:21<01:33, 13.72it/s][A
Training:  15%|██████                  

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 38.05it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 37.92it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 38.51it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 37.94it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.76it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.05it/s][A[A

Training:  20%|████████▎                                 | 295/1501 [00:30<13:25,  1.50it/s][A
Training:  20%|████████▎                                 | 297/1501 [00:30<10:00,  2.00it/s][A

>>> training loss:  0.3325, valid loss:  2.1045, valid f1 score:  0.4906



Training:  20%|████████▎                                 | 299/1501 [00:30<07:29,  2.67it/s][A
Training:  20%|████████▍                                 | 301/1501 [00:30<05:39,  3.53it/s][A
Training:  20%|████████▍                                 | 303/1501 [00:30<04:18,  4.63it/s][A
Training:  20%|████████▌                                 | 305/1501 [00:30<03:23,  5.86it/s][A
Training:  20%|████████▌                                 | 307/1501 [00:30<02:42,  7.34it/s][A
Training:  21%|████████▋                                 | 309/1501 [00:31<02:15,  8.79it/s][A
Training:  21%|████████▋                                 | 311/1501 [00:31<01:53, 10.45it/s][A
Training:  21%|████████▊                                 | 313/1501 [00:31<01:37, 12.17it/s][A
Training:  21%|████████▊                                 | 315/1501 [00:31<01:26, 13.63it/s][A
Training:  21%|████████▊                                 | 317/1501 [00:31<01:20, 14.72it/s][A
Training:  21%|████████▉               

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:04<00:01, 25.03it/s][A[A

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 26.74it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 25.05it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 25.66it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 25.78it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 24.69it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 25.05it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:05<00:00, 25.09it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:05<00:00, 25.07it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 31.46it/s][A[A



>>> training loss:  0.3353, valid loss:  2.0903, valid f1 score:  0.5083



Training:  26%|███████████                               | 397/1501 [00:41<11:33,  1.59it/s][A
Training:  27%|███████████▏                              | 399/1501 [00:41<08:37,  2.13it/s][A
Training:  27%|███████████▏                              | 401/1501 [00:41<06:27,  2.84it/s][A
Training:  27%|███████████▎                              | 403/1501 [00:42<04:50,  3.78it/s][A
Training:  27%|███████████▎                              | 405/1501 [00:42<03:43,  4.90it/s][A
Training:  27%|███████████▍                              | 407/1501 [00:42<02:54,  6.28it/s][A
Training:  27%|███████████▍                              | 409/1501 [00:42<02:20,  7.80it/s][A
Training:  27%|███████████▌                              | 411/1501 [00:42<02:07,  8.53it/s][A
Training:  28%|███████████▌                              | 413/1501 [00:42<01:55,  9.44it/s][A
Training:  28%|███████████▌                              | 415/1501 [00:42<01:44, 10.44it/s][A
Training:  28%|███████████▋            

Evaluation...:  72%|███████████████████████████▌          | 121/167 [00:03<00:01, 35.37it/s][A[A

Evaluation...:  75%|████████████████████████████▍         | 125/167 [00:03<00:01, 35.62it/s][A[A

Evaluation...:  77%|█████████████████████████████▎        | 129/167 [00:04<00:01, 34.41it/s][A[A

Evaluation...:  80%|██████████████████████████████▎       | 133/167 [00:04<00:00, 34.83it/s][A[A

Evaluation...:  82%|███████████████████████████████▏      | 137/167 [00:04<00:00, 35.72it/s][A[A

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:04<00:00, 35.43it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 34.40it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 36.74it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 36.10it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 36.91it/s][A[A



>>> training loss:  0.3463, valid loss:  2.1338, valid f1 score:  0.4919



Training:  33%|█████████████▉                            | 499/1501 [00:53<07:22,  2.26it/s][A
Training:  33%|██████████████                            | 501/1501 [00:53<05:25,  3.07it/s][A
Training:  34%|██████████████                            | 503/1501 [00:53<04:03,  4.10it/s][A
Training:  34%|██████████████▏                           | 505/1501 [00:53<03:07,  5.32it/s][A
Training:  34%|██████████████▏                           | 507/1501 [00:54<02:28,  6.70it/s][A
Training:  34%|██████████████▏                           | 509/1501 [00:54<02:00,  8.22it/s][A
Training:  34%|██████████████▎                           | 511/1501 [00:54<01:42,  9.61it/s][A
Training:  34%|██████████████▎                           | 513/1501 [00:54<01:47,  9.22it/s][A
Training:  34%|██████████████▍                           | 515/1501 [00:54<01:32, 10.69it/s][A
Training:  34%|██████████████▍                           | 517/1501 [00:54<01:21, 12.05it/s][A
Training:  35%|██████████████▌         

Evaluation...:  78%|█████████████████████████████▌        | 130/167 [00:03<00:01, 34.04it/s][A[A

Evaluation...:  80%|██████████████████████████████▍       | 134/167 [00:04<00:00, 34.49it/s][A[A

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:04<00:00, 33.20it/s][A[A

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 32.59it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 30.55it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 30.70it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 30.19it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 30.85it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:05<00:00, 29.60it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 32.01it/s][A[A



>>> training loss:  0.3642, valid loss:  2.1032, valid f1 score:  0.5061



Training:  40%|████████████████▊                         | 599/1501 [01:05<06:49,  2.20it/s][A
Training:  40%|████████████████▊                         | 601/1501 [01:06<05:05,  2.95it/s][A
Training:  40%|████████████████▊                         | 603/1501 [01:06<03:50,  3.89it/s][A
Training:  40%|████████████████▉                         | 605/1501 [01:06<03:02,  4.91it/s][A
Training:  40%|████████████████▉                         | 607/1501 [01:06<02:24,  6.19it/s][A
Training:  41%|█████████████████                         | 609/1501 [01:06<01:59,  7.45it/s][A
Training:  41%|█████████████████                         | 611/1501 [01:06<01:41,  8.73it/s][A
Training:  41%|█████████████████▏                        | 613/1501 [01:06<01:29,  9.92it/s][A
Training:  41%|█████████████████▏                        | 615/1501 [01:07<01:21, 10.92it/s][A
Training:  41%|█████████████████▎                        | 617/1501 [01:07<01:12, 12.24it/s][A
Training:  41%|█████████████████▎      

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:04<00:00, 31.85it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 30.10it/s][A[A

Evaluation...:  89%|█████████████████████████████████▉    | 149/167 [00:04<00:00, 31.04it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 31.26it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 32.70it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 31.71it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.46it/s][A[A

Training:  46%|███████████████████▍                      | 695/1501 [01:16<10:35,  1.27it/s][A
Training:  46%|███████████████████▌                      | 697/1501 [01:17<07:39,  1.75it/s][A

>>> training loss:  0.3611, valid loss:  2.1131, valid f1 score:  0.4986



Training:  47%|███████████████████▌                      | 699/1501 [01:17<05:38,  2.37it/s][A
Training:  47%|███████████████████▌                      | 701/1501 [01:17<04:11,  3.18it/s][A
Training:  47%|███████████████████▋                      | 703/1501 [01:17<03:08,  4.23it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [01:17<02:27,  5.41it/s][A
Training:  47%|███████████████████▊                      | 707/1501 [01:17<01:58,  6.73it/s][A
Training:  47%|███████████████████▊                      | 709/1501 [01:17<01:39,  7.93it/s][A
Training:  47%|███████████████████▉                      | 711/1501 [01:17<01:28,  8.90it/s][A
Training:  48%|███████████████████▉                      | 713/1501 [01:18<01:19,  9.92it/s][A
Training:  48%|████████████████████                      | 715/1501 [01:18<01:12, 10.90it/s][A
Training:  48%|████████████████████                      | 717/1501 [01:18<01:07, 11.63it/s][A
Training:  48%|████████████████████    

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:03<00:00, 36.06it/s][A[A

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 36.67it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 35.89it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 37.43it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 36.98it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.53it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.32it/s][A[A

Training:  53%|██████████████████████▏                   | 795/1501 [01:28<09:07,  1.29it/s][A
Training:  53%|██████████████████████▎                   | 797/1501 [01:28<06:34,  1.79it/s][A

>>> training loss:  0.3746, valid loss:  2.1289, valid f1 score:  0.5085



Training:  53%|██████████████████████▎                   | 799/1501 [01:28<04:49,  2.43it/s][A
Training:  53%|██████████████████████▍                   | 801/1501 [01:28<03:34,  3.27it/s][A
Training:  53%|██████████████████████▍                   | 803/1501 [01:28<02:40,  4.34it/s][A
Training:  54%|██████████████████████▌                   | 805/1501 [01:28<02:05,  5.54it/s][A
Training:  54%|██████████████████████▌                   | 807/1501 [01:28<01:39,  6.99it/s][A
Training:  54%|██████████████████████▋                   | 809/1501 [01:29<01:22,  8.42it/s][A
Training:  54%|██████████████████████▋                   | 811/1501 [01:29<01:10,  9.73it/s][A
Training:  54%|██████████████████████▋                   | 813/1501 [01:29<01:03, 10.84it/s][A
Training:  54%|██████████████████████▊                   | 815/1501 [01:29<00:55, 12.42it/s][A
Training:  54%|██████████████████████▊                   | 817/1501 [01:29<00:49, 13.94it/s][A
Training:  55%|██████████████████████▉ 

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:04<00:00, 29.55it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 29.05it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 29.76it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 28.85it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 28.86it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 28.99it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 28.65it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.13it/s][A[A

Training:  60%|█████████████████████████                 | 895/1501 [01:39<08:03,  1.25it/s][A

>>> training loss:  0.3995, valid loss:  2.1307, valid f1 score:  0.5032



Training:  60%|█████████████████████████                 | 897/1501 [01:39<05:50,  1.72it/s][A
Training:  60%|█████████████████████████▏                | 899/1501 [01:39<04:18,  2.33it/s][A
Training:  60%|█████████████████████████▏                | 901/1501 [01:39<03:12,  3.12it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:40<02:28,  4.04it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:40<01:54,  5.19it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:40<01:30,  6.54it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:40<01:14,  7.94it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:40<01:03,  9.36it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:40<00:53, 11.00it/s][A
Training:  61%|█████████████████████████▌                | 915/1501 [01:40<00:47, 12.30it/s][A
Training:  61%|████████████████████████

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:03<00:00, 36.55it/s][A[A

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 37.39it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 37.30it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 38.42it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 37.62it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.50it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.33it/s][A[A

Training:  66%|███████████████████████████▊              | 995/1501 [01:50<06:18,  1.34it/s][A
Training:  66%|███████████████████████████▉              | 997/1501 [01:50<04:35,  1.83it/s][A

>>> training loss:  0.4452, valid loss:  2.1534, valid f1 score:  0.4972



Training:  67%|███████████████████████████▉              | 999/1501 [01:50<03:19,  2.51it/s][A
Training:  67%|███████████████████████████▎             | 1001/1501 [01:50<02:29,  3.35it/s][A
Training:  67%|███████████████████████████▍             | 1003/1501 [01:51<01:52,  4.43it/s][A
Training:  67%|███████████████████████████▍             | 1005/1501 [01:51<01:26,  5.72it/s][A
Training:  67%|███████████████████████████▌             | 1007/1501 [01:51<01:08,  7.17it/s][A
Training:  67%|███████████████████████████▌             | 1009/1501 [01:51<00:57,  8.60it/s][A
Training:  67%|███████████████████████████▌             | 1011/1501 [01:51<00:48, 10.13it/s][A
Training:  67%|███████████████████████████▋             | 1013/1501 [01:51<00:42, 11.60it/s][A
Training:  68%|███████████████████████████▋             | 1015/1501 [01:51<00:38, 12.70it/s][A
Training:  68%|███████████████████████████▊             | 1017/1501 [01:51<00:35, 13.61it/s][A
Training:  68%|████████████████████████

Evaluation...:  77%|█████████████████████████████▎        | 129/167 [00:03<00:01, 34.52it/s][A[A

Evaluation...:  80%|██████████████████████████████▎       | 133/167 [00:04<00:01, 33.10it/s][A[A

Evaluation...:  82%|███████████████████████████████▏      | 137/167 [00:04<00:00, 32.90it/s][A[A

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:04<00:00, 31.78it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 29.75it/s][A[A

Evaluation...:  89%|█████████████████████████████████▉    | 149/167 [00:04<00:00, 30.86it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 30.16it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 30.46it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:05<00:00, 29.44it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 31.90it/s][A[A



>>> training loss:  0.4166, valid loss:  2.1192, valid f1 score:  0.4980



Training:  73%|█████████████████████████████▉           | 1097/1501 [02:02<04:10,  1.61it/s][A
Training:  73%|██████████████████████████████           | 1099/1501 [02:02<03:03,  2.19it/s][A
Training:  73%|██████████████████████████████           | 1101/1501 [02:02<02:15,  2.95it/s][A
Training:  73%|██████████████████████████████▏          | 1103/1501 [02:02<01:43,  3.85it/s][A
Training:  74%|██████████████████████████████▏          | 1105/1501 [02:02<01:20,  4.95it/s][A
Training:  74%|██████████████████████████████▏          | 1107/1501 [02:02<01:06,  5.95it/s][A
Training:  74%|██████████████████████████████▎          | 1109/1501 [02:02<00:55,  7.08it/s][A
Training:  74%|██████████████████████████████▎          | 1111/1501 [02:03<00:47,  8.25it/s][A
Training:  74%|██████████████████████████████▍          | 1113/1501 [02:03<00:40,  9.51it/s][A
Training:  74%|██████████████████████████████▍          | 1115/1501 [02:03<00:35, 10.87it/s][A
Training:  74%|████████████████████████

Evaluation...:  78%|█████████████████████████████▌        | 130/167 [00:04<00:01, 33.70it/s][A[A

Evaluation...:  80%|██████████████████████████████▍       | 134/167 [00:04<00:00, 34.88it/s][A[A

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:04<00:00, 35.45it/s][A[A

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 36.36it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 35.83it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 36.95it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 36.25it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 36.88it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 35.15it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 32.97it/s][A[A



>>> training loss:  0.4416, valid loss:  2.1761, valid f1 score:  0.4848



Training:  80%|████████████████████████████████▋        | 1197/1501 [02:14<03:03,  1.66it/s][A
Training:  80%|████████████████████████████████▊        | 1199/1501 [02:14<02:13,  2.26it/s][A
Training:  80%|████████████████████████████████▊        | 1201/1501 [02:14<01:38,  3.03it/s][A
Training:  80%|████████████████████████████████▊        | 1203/1501 [02:14<01:14,  3.98it/s][A
Training:  80%|████████████████████████████████▉        | 1205/1501 [02:14<00:58,  5.05it/s][A
Training:  80%|████████████████████████████████▉        | 1207/1501 [02:14<00:46,  6.27it/s][A
Training:  81%|█████████████████████████████████        | 1209/1501 [02:14<00:38,  7.54it/s][A
Training:  81%|█████████████████████████████████        | 1211/1501 [02:14<00:33,  8.69it/s][A
Training:  81%|█████████████████████████████████▏       | 1213/1501 [02:15<00:29,  9.66it/s][A
Training:  81%|█████████████████████████████████▏       | 1215/1501 [02:15<00:26, 10.60it/s][A
Training:  81%|████████████████████████

Evaluation...:  72%|███████████████████████████▌          | 121/167 [00:03<00:01, 36.14it/s][A[A

Evaluation...:  75%|████████████████████████████▍         | 125/167 [00:03<00:01, 36.60it/s][A[A

Evaluation...:  77%|█████████████████████████████▎        | 129/167 [00:04<00:01, 35.23it/s][A[A

Evaluation...:  80%|██████████████████████████████▎       | 133/167 [00:04<00:00, 35.92it/s][A[A

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:04<00:00, 37.20it/s][A[A

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:04<00:00, 37.66it/s][A[A

Evaluation...:  87%|█████████████████████████████████▏    | 146/167 [00:04<00:00, 36.58it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 37.51it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 36.64it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 37.33it/s][A[A



>>> training loss:  0.4063, valid loss:  2.1422, valid f1 score:  0.4846



Training:  86%|███████████████████████████████████▍     | 1297/1501 [02:26<02:06,  1.61it/s][A
Training:  87%|███████████████████████████████████▍     | 1299/1501 [02:26<01:32,  2.19it/s][A
Training:  87%|███████████████████████████████████▌     | 1301/1501 [02:26<01:08,  2.93it/s][A
Training:  87%|███████████████████████████████████▌     | 1303/1501 [02:27<00:51,  3.85it/s][A
Training:  87%|███████████████████████████████████▋     | 1305/1501 [02:27<00:39,  4.92it/s][A
Training:  87%|███████████████████████████████████▋     | 1307/1501 [02:27<00:31,  6.08it/s][A
Training:  87%|███████████████████████████████████▊     | 1309/1501 [02:27<00:26,  7.34it/s][A
Training:  87%|███████████████████████████████████▊     | 1311/1501 [02:27<00:21,  8.67it/s][A
Training:  87%|███████████████████████████████████▊     | 1313/1501 [02:27<00:20,  9.39it/s][A
Training:  88%|███████████████████████████████████▉     | 1315/1501 [02:27<00:17, 10.69it/s][A
Training:  88%|████████████████████████

Evaluation...:  66%|█████████████████████████▎            | 111/167 [00:03<00:01, 28.65it/s][A[A

Evaluation...:  69%|██████████████████████████▏           | 115/167 [00:04<00:01, 29.19it/s][A[A

Evaluation...:  71%|██████████████████████████▊           | 118/167 [00:04<00:01, 27.74it/s][A[A

Evaluation...:  72%|███████████████████████████▌          | 121/167 [00:04<00:01, 28.01it/s][A[A

Evaluation...:  75%|████████████████████████████▍         | 125/167 [00:04<00:01, 28.86it/s][A[A

Evaluation...:  77%|█████████████████████████████▏        | 128/167 [00:04<00:01, 28.12it/s][A[A

Evaluation...:  78%|█████████████████████████████▊        | 131/167 [00:04<00:01, 26.20it/s][A[A

Evaluation...:  80%|██████████████████████████████▍       | 134/167 [00:04<00:01, 27.01it/s][A[A

Evaluation...:  83%|███████████████████████████████▍      | 138/167 [00:04<00:01, 27.99it/s][A[A

Evaluation...:  85%|████████████████████████████████▎     | 142/167 [00:05<00:00, 29.08it/s][A[A



>>> training loss:  0.4657, valid loss:  2.0980, valid f1 score:  0.4986



Training:  93%|██████████████████████████████████████▏  | 1397/1501 [02:39<01:12,  1.44it/s][A
Training:  93%|██████████████████████████████████████▏  | 1399/1501 [02:39<00:51,  1.97it/s][A
Training:  93%|██████████████████████████████████████▎  | 1401/1501 [02:40<00:37,  2.65it/s][A
Training:  93%|██████████████████████████████████████▎  | 1403/1501 [02:40<00:27,  3.54it/s][A
Training:  94%|██████████████████████████████████████▍  | 1405/1501 [02:40<00:21,  4.50it/s][A
Training:  94%|██████████████████████████████████████▍  | 1407/1501 [02:40<00:16,  5.71it/s][A
Training:  94%|██████████████████████████████████████▍  | 1409/1501 [02:40<00:13,  6.93it/s][A
Training:  94%|██████████████████████████████████████▌  | 1411/1501 [02:40<00:11,  8.08it/s][A
Training:  94%|██████████████████████████████████████▌  | 1413/1501 [02:40<00:09,  8.94it/s][A
Training:  94%|██████████████████████████████████████▋  | 1415/1501 [02:41<00:08,  9.95it/s][A
Training:  94%|████████████████████████

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:03<00:00, 38.18it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 37.51it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 36.76it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 37.66it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 38.87it/s][A[A

Evaluation...:  97%|████████████████████████████████████▊ | 162/167 [00:04<00:00, 37.92it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.70it/s][A[A

Training: 100%|████████████████████████████████████████▊| 1495/1501 [02:50<00:04,  1.38it/s][A
Training: 100%|████████████████████████████████████████▉| 1497/1501 [02:50<00:02,  1.90it/s][A

>>> training loss:  0.4691, valid loss:  2.1113, valid f1 score:  0.4982



Training: 100%|█████████████████████████████████████████| 1501/1501 [02:50<00:00,  8.79it/s][A
 88%|█████████████████████████████████████████████████       | 7/8 [18:24<02:39, 159.42s/it]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:23, 17.90it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:30, 16.60it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:30, 16.50it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:34, 15.78it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:30, 16.43it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:32, 16.09it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:32, 16.16it/s][A
Training:   1%|▍                          

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:03<00:00, 38.70it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 39.24it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 37.85it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.44it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.43it/s][A[A

Training:   6%|██▋                                        | 93/1501 [00:10<14:57,  1.57it/s][A
Training:   6%|██▋                                        | 95/1501 [00:10<11:13,  2.09it/s][A

>>> training loss:  0.3189, valid loss:  2.0959, valid f1 score:  0.4924



Training:   6%|██▊                                        | 97/1501 [00:10<08:42,  2.69it/s][A
Training:   7%|██▊                                        | 99/1501 [00:11<06:36,  3.54it/s][A
Training:   7%|██▊                                       | 101/1501 [00:11<05:02,  4.63it/s][A
Training:   7%|██▉                                       | 103/1501 [00:11<03:59,  5.85it/s][A
Training:   7%|██▉                                       | 105/1501 [00:11<03:11,  7.28it/s][A
Training:   7%|██▉                                       | 107/1501 [00:11<02:37,  8.87it/s][A
Training:   7%|███                                       | 109/1501 [00:11<02:12, 10.47it/s][A
Training:   7%|███                                       | 111/1501 [00:11<01:55, 12.03it/s][A
Training:   8%|███▏                                      | 113/1501 [00:11<01:43, 13.47it/s][A
Training:   8%|███▏                                      | 115/1501 [00:11<01:37, 14.18it/s][A
Training:   8%|███▎                    

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 40.59it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 39.34it/s][A[A

Training:  13%|█████▍                                    | 194/1501 [00:20<15:08,  1.44it/s][A
Training:  13%|█████▍                                    | 196/1501 [00:20<10:56,  1.99it/s][A

>>> training loss:  0.3123, valid loss:  2.1610, valid f1 score:  0.4956



Training:  13%|█████▌                                    | 198/1501 [00:20<08:00,  2.71it/s][A
Training:  13%|█████▌                                    | 200/1501 [00:21<05:58,  3.63it/s][A
Training:  13%|█████▋                                    | 202/1501 [00:21<04:29,  4.81it/s][A
Training:  14%|█████▋                                    | 204/1501 [00:21<03:30,  6.17it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:21<02:47,  7.75it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:21<02:19,  9.29it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:21<01:59, 10.83it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:21<01:46, 12.14it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:21<01:37, 13.25it/s][A
Training:  14%|██████                                    | 216/1501 [00:21<01:30, 14.26it/s][A
Training:  15%|██████                  

Training:  20%|████████▎                                 | 296/1501 [00:30<09:52,  2.03it/s][A

>>> training loss:  0.3362, valid loss:  2.1944, valid f1 score:  0.4962



Training:  20%|████████▎                                 | 298/1501 [00:30<07:16,  2.76it/s][A
Training:  20%|████████▍                                 | 300/1501 [00:30<05:24,  3.70it/s][A
Training:  20%|████████▍                                 | 302/1501 [00:30<04:05,  4.89it/s][A
Training:  20%|████████▌                                 | 304/1501 [00:31<03:12,  6.23it/s][A
Training:  20%|████████▌                                 | 306/1501 [00:31<02:35,  7.67it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:31<02:09,  9.22it/s][A
Training:  21%|████████▋                                 | 310/1501 [00:31<01:49, 10.91it/s][A
Training:  21%|████████▋                                 | 312/1501 [00:31<01:35, 12.46it/s][A
Training:  21%|████████▊                                 | 314/1501 [00:31<01:30, 13.18it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:31<01:23, 14.15it/s][A
Training:  21%|████████▉               

Training:  26%|███████████                               | 394/1501 [00:40<12:40,  1.46it/s][A
Training:  26%|███████████                               | 396/1501 [00:40<09:09,  2.01it/s][A

>>> training loss:  0.3388, valid loss:  2.1545, valid f1 score:  0.4983



Training:  27%|███████████▏                              | 398/1501 [00:40<06:43,  2.74it/s][A
Training:  27%|███████████▏                              | 400/1501 [00:40<04:59,  3.68it/s][A
Training:  27%|███████████▏                              | 402/1501 [00:40<03:49,  4.80it/s][A
Training:  27%|███████████▎                              | 404/1501 [00:40<02:59,  6.10it/s][A
Training:  27%|███████████▎                              | 406/1501 [00:40<02:22,  7.68it/s][A
Training:  27%|███████████▍                              | 408/1501 [00:41<01:56,  9.38it/s][A
Training:  27%|███████████▍                              | 410/1501 [00:41<01:40, 10.87it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:41<01:28, 12.33it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:41<01:21, 13.39it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:41<01:15, 14.42it/s][A
Training:  28%|███████████▋            

>>> training loss:  0.3272, valid loss:  2.1747, valid f1 score:  0.4933



Training:  33%|█████████████▉                            | 498/1501 [00:50<05:56,  2.81it/s][A
Training:  33%|█████████████▉                            | 500/1501 [00:50<04:26,  3.75it/s][A
Training:  33%|██████████████                            | 502/1501 [00:50<03:22,  4.94it/s][A
Training:  34%|██████████████                            | 504/1501 [00:50<02:38,  6.29it/s][A
Training:  34%|██████████████▏                           | 506/1501 [00:50<02:07,  7.81it/s][A
Training:  34%|██████████████▏                           | 508/1501 [00:50<01:46,  9.35it/s][A
Training:  34%|██████████████▎                           | 510/1501 [00:50<01:30, 10.94it/s][A
Training:  34%|██████████████▎                           | 512/1501 [00:51<01:21, 12.19it/s][A
Training:  34%|██████████████▍                           | 514/1501 [00:51<01:15, 13.08it/s][A
Training:  34%|██████████████▍                           | 516/1501 [00:51<01:09, 14.21it/s][A
Training:  35%|██████████████▍         

Training:  40%|████████████████▋                         | 596/1501 [00:59<07:26,  2.02it/s][A

>>> training loss:  0.3551, valid loss:  2.2354, valid f1 score:  0.5015



Training:  40%|████████████████▋                         | 598/1501 [00:59<05:28,  2.75it/s][A
Training:  40%|████████████████▊                         | 600/1501 [01:00<04:03,  3.70it/s][A
Training:  40%|████████████████▊                         | 602/1501 [01:00<03:03,  4.90it/s][A
Training:  40%|████████████████▉                         | 604/1501 [01:00<02:40,  5.59it/s][A
Training:  40%|████████████████▉                         | 606/1501 [01:00<02:06,  7.08it/s][A
Training:  41%|█████████████████                         | 608/1501 [01:00<01:42,  8.74it/s][A
Training:  41%|█████████████████                         | 610/1501 [01:00<01:25, 10.43it/s][A
Training:  41%|█████████████████                         | 612/1501 [01:00<01:13, 12.10it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [01:00<01:05, 13.46it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [01:01<00:59, 14.83it/s][A
Training:  41%|█████████████████▎      

Training:  46%|███████████████████▍                      | 693/1501 [01:09<09:25,  1.43it/s][A
Training:  46%|███████████████████▍                      | 695/1501 [01:09<06:50,  1.96it/s][A

>>> training loss:  0.3530, valid loss:  2.1683, valid f1 score:  0.5036



Training:  46%|███████████████████▌                      | 697/1501 [01:09<05:01,  2.67it/s][A
Training:  47%|███████████████████▌                      | 699/1501 [01:10<03:43,  3.59it/s][A
Training:  47%|███████████████████▌                      | 701/1501 [01:10<02:50,  4.69it/s][A
Training:  47%|███████████████████▋                      | 703/1501 [01:10<02:11,  6.05it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [01:10<01:44,  7.65it/s][A
Training:  47%|███████████████████▊                      | 707/1501 [01:10<01:25,  9.31it/s][A
Training:  47%|███████████████████▊                      | 709/1501 [01:10<01:13, 10.81it/s][A
Training:  47%|███████████████████▉                      | 711/1501 [01:10<01:04, 12.34it/s][A
Training:  48%|███████████████████▉                      | 713/1501 [01:10<00:58, 13.49it/s][A
Training:  48%|████████████████████                      | 715/1501 [01:10<00:55, 14.09it/s][A
Training:  48%|████████████████████    

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:04<00:00, 34.87it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 33.87it/s][A[A

Evaluation...:  89%|█████████████████████████████████▉    | 149/167 [00:04<00:00, 35.43it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 35.52it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 36.49it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 35.65it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 34.35it/s][A[A

Training:  53%|██████████████████████▏                   | 793/1501 [01:20<09:22,  1.26it/s][A
Training:  53%|██████████████████████▏                   | 795/1501 [01:21<06:44,  1.74it/s][A

>>> training loss:  0.3747, valid loss:  2.1682, valid f1 score:  0.4958



Training:  53%|██████████████████████▎                   | 797/1501 [01:21<04:55,  2.38it/s][A
Training:  53%|██████████████████████▎                   | 799/1501 [01:21<03:40,  3.19it/s][A
Training:  53%|██████████████████████▍                   | 801/1501 [01:21<02:44,  4.24it/s][A
Training:  53%|██████████████████████▍                   | 803/1501 [01:21<02:06,  5.53it/s][A
Training:  54%|██████████████████████▌                   | 805/1501 [01:21<01:39,  7.02it/s][A
Training:  54%|██████████████████████▌                   | 807/1501 [01:21<01:19,  8.68it/s][A
Training:  54%|██████████████████████▋                   | 809/1501 [01:21<01:07, 10.32it/s][A
Training:  54%|██████████████████████▋                   | 811/1501 [01:22<00:59, 11.56it/s][A
Training:  54%|██████████████████████▋                   | 813/1501 [01:22<00:54, 12.58it/s][A
Training:  54%|██████████████████████▊                   | 815/1501 [01:22<00:49, 13.87it/s][A
Training:  54%|██████████████████████▊ 

Evaluation...:  83%|███████████████████████████████▋      | 139/167 [00:04<00:00, 36.58it/s][A[A

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:04<00:00, 36.69it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 34.01it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 31.68it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 28.89it/s][A[A

Evaluation...:  95%|███████████████████████████████████▉  | 158/167 [00:04<00:00, 28.39it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 26.29it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:05<00:00, 32.12it/s][A[A

Training:  59%|████████████████████████▉                 | 893/1501 [01:32<08:32,  1.19it/s][A
Training:  60%|█████████████████████████                 | 895/1501 [01:32<06:08,  1.65it/s][A

>>> training loss:  0.3768, valid loss:  2.1649, valid f1 score:  0.4944



Training:  60%|█████████████████████████                 | 897/1501 [01:32<04:27,  2.26it/s][A
Training:  60%|█████████████████████████▏                | 899/1501 [01:32<03:19,  3.02it/s][A
Training:  60%|█████████████████████████▏                | 901/1501 [01:32<02:28,  4.04it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:32<01:55,  5.20it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:32<01:30,  6.56it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:32<01:13,  8.06it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:32<01:03,  9.39it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:33<00:55, 10.62it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:33<00:50, 11.61it/s][A
Training:  61%|█████████████████████████▌                | 915/1501 [01:33<00:46, 12.73it/s][A
Training:  61%|████████████████████████

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 36.37it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 36.48it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 37.22it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 36.42it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.28it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.50it/s][A[A

Training:  66%|███████████████████████████▊              | 993/1501 [01:43<06:19,  1.34it/s][A
Training:  66%|███████████████████████████▊              | 995/1501 [01:43<04:33,  1.85it/s][A

>>> training loss:  0.3371, valid loss:  2.1892, valid f1 score:  0.4950



Training:  66%|███████████████████████████▉              | 997/1501 [01:43<03:19,  2.53it/s][A
Training:  67%|███████████████████████████▉              | 999/1501 [01:43<02:27,  3.41it/s][A
Training:  67%|███████████████████████████▎             | 1001/1501 [01:43<01:51,  4.49it/s][A
Training:  67%|███████████████████████████▍             | 1003/1501 [01:43<01:26,  5.76it/s][A
Training:  67%|███████████████████████████▍             | 1005/1501 [01:43<01:09,  7.16it/s][A
Training:  67%|███████████████████████████▌             | 1007/1501 [01:43<00:57,  8.62it/s][A
Training:  67%|███████████████████████████▌             | 1009/1501 [01:44<00:48, 10.12it/s][A
Training:  67%|███████████████████████████▌             | 1011/1501 [01:44<00:42, 11.52it/s][A
Training:  67%|███████████████████████████▋             | 1013/1501 [01:44<00:38, 12.76it/s][A
Training:  68%|███████████████████████████▋             | 1015/1501 [01:44<00:35, 13.74it/s][A
Training:  68%|████████████████████████

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:03<00:00, 36.32it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 36.44it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 37.75it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 37.28it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 37.18it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.60it/s][A[A

Training:  73%|█████████████████████████████▊           | 1093/1501 [01:53<05:03,  1.34it/s][A
Training:  73%|█████████████████████████████▉           | 1095/1501 [01:53<03:38,  1.85it/s][A

>>> training loss:  0.3912, valid loss:  2.2049, valid f1 score:  0.5006



Training:  73%|█████████████████████████████▉           | 1097/1501 [01:53<02:39,  2.54it/s][A
Training:  73%|██████████████████████████████           | 1099/1501 [01:54<01:58,  3.39it/s][A
Training:  73%|██████████████████████████████           | 1101/1501 [01:54<01:29,  4.47it/s][A
Training:  73%|██████████████████████████████▏          | 1103/1501 [01:54<01:08,  5.77it/s][A
Training:  74%|██████████████████████████████▏          | 1105/1501 [01:54<00:54,  7.22it/s][A
Training:  74%|██████████████████████████████▏          | 1107/1501 [01:54<00:45,  8.67it/s][A
Training:  74%|██████████████████████████████▎          | 1109/1501 [01:54<00:37, 10.33it/s][A
Training:  74%|██████████████████████████████▎          | 1111/1501 [01:54<00:33, 11.56it/s][A
Training:  74%|██████████████████████████████▍          | 1113/1501 [01:54<00:29, 13.22it/s][A
Training:  74%|██████████████████████████████▍          | 1115/1501 [01:54<00:26, 14.47it/s][A
Training:  74%|████████████████████████

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 37.09it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:04<00:00, 36.60it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 37.28it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 36.31it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 35.81it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.97it/s][A[A

Training:  79%|████████████████████████████████▌        | 1193/1501 [02:03<03:47,  1.35it/s][A
Training:  80%|████████████████████████████████▋        | 1195/1501 [02:04<02:43,  1.87it/s][A

>>> training loss:  0.3841, valid loss:  2.2323, valid f1 score:  0.4932



Training:  80%|████████████████████████████████▋        | 1197/1501 [02:04<01:58,  2.56it/s][A
Training:  80%|████████████████████████████████▊        | 1199/1501 [02:04<01:28,  3.42it/s][A
Training:  80%|████████████████████████████████▊        | 1201/1501 [02:04<01:07,  4.47it/s][A
Training:  80%|████████████████████████████████▊        | 1203/1501 [02:04<00:52,  5.72it/s][A
Training:  80%|████████████████████████████████▉        | 1205/1501 [02:04<00:40,  7.25it/s][A
Training:  80%|████████████████████████████████▉        | 1207/1501 [02:04<00:33,  8.73it/s][A
Training:  81%|█████████████████████████████████        | 1209/1501 [02:04<00:28, 10.38it/s][A
Training:  81%|█████████████████████████████████        | 1211/1501 [02:05<00:24, 11.98it/s][A
Training:  81%|█████████████████████████████████▏       | 1213/1501 [02:05<00:21, 13.12it/s][A
Training:  81%|█████████████████████████████████▏       | 1215/1501 [02:05<00:20, 14.27it/s][A
Training:  81%|████████████████████████

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:04<00:00, 35.63it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 34.50it/s][A[A

Evaluation...:  89%|█████████████████████████████████▉    | 149/167 [00:04<00:00, 35.70it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 35.62it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 36.55it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 36.12it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 35.20it/s][A[A

Training:  86%|███████████████████████████████████▎     | 1293/1501 [02:14<02:40,  1.29it/s][A
Training:  86%|███████████████████████████████████▎     | 1295/1501 [02:14<01:55,  1.79it/s][A

>>> training loss:  0.4291, valid loss:  2.1996, valid f1 score:  0.4877



Training:  86%|███████████████████████████████████▍     | 1297/1501 [02:14<01:23,  2.45it/s][A
Training:  87%|███████████████████████████████████▍     | 1299/1501 [02:14<01:01,  3.30it/s][A
Training:  87%|███████████████████████████████████▌     | 1301/1501 [02:15<00:20,  9.63it/s][A
 88%|█████████████████████████████████████████████████       | 7/8 [20:39<02:57, 177.11s/it]


KeyboardInterrupt: 

## 预测并保存结果

In [None]:
def predict(config, id2label, model, test_dataloader):
    test_iterator = tqdm(test_dataloader, desc='Testing', total=len(test_dataloader))
    model.eval()
    test_preds = []
    
    with torch.no_grad():
        for batch in test_iterator:
            batch = {item: value.to(config['device']) for item, value in batch.items()}

            logits = model(**batch)[1]
            test_preds.append(logits.argmax(dim=-1).detach().cpu())
            
    test_preds = torch.cat(test_preds, dim=0).numpy()
    test_preds = [id2label[id_] for id_ in test_preds]
        
    test_df = pd.read_csv(config['test_file_path'], sep=',')
    test_df.insert(1, column=['label_pred'], value=test_preds)
    #test_df.drop(columns=['sentence'], inplace=True)
    test_df.to_csv('submission.csv', index=False, encoding='utf8')

In [None]:
predict(config, id2label, model, test_dataloader)