# 基于TextCNN的头条新闻分类笔记

## 编写配置

In [1]:
import torch 
import torch.nn as nn

# Global experiment settings shared by every cell below.
config = {
    'train_file_path': '../../../data/toutiao_news_cls/train.csv',
    'test_file_path': '../../../data/toutiao_news_cls/test.csv',
    'train_val_ratio': 0.1,  # fraction of the training file held out for validation (10%)
    'vocab_size': 10000,   # keep the 10,000 most frequent tokens; overwritten later with the size returned by get_embedding
    'batch_size': 32,      # number of examples per batch
    'num_epochs': 10,      # number of passes over the training set
    'learning_rate': 1e-3, # optimizer learning rate
    'logging_step': 300,   # run validation every 300 training batches
    'seed': 2022           # random seed
}

# Use the GPU when one is available, otherwise fall back to the CPU.
config['device'] = 'cuda' if torch.cuda.is_available() else 'cpu' # cpu&gpu

import random
import numpy as np

def seed_everything(seed):
    """Seed every random number generator this notebook relies on.

    Seeds Python's ``random`` module, NumPy's global generator, PyTorch's CPU
    generator and the generators of all CUDA devices, in that order.

    Args:
        seed: Integer seed applied to each generator.

    Returns:
        The seed that was passed in, unchanged.
    """
    seeders = (
        random.seed,
        np.random.seed,
        torch.manual_seed,
        torch.cuda.manual_seed_all,
    )
    for apply_seed in seeders:
        apply_seed(seed)
    return seed

# Apply the configured seed before any random operation runs; the cell echoes the seed value.
seed_everything(config['seed'])

2022

## 获得词汇表

In [2]:
from collections import Counter
from tqdm import tqdm
import jieba

def get_vocab(config):
    """Collect the most frequent jieba tokens of the training titles.

    The training file is parsed with the ``csv`` module rather than a plain
    ``split(',')`` so that quoted titles containing commas are kept whole.
    When the first row is a header containing a ``sentence`` column (the
    column ``read_data`` reads), that row is skipped and that column is used;
    otherwise the last column of every row is used, as before.

    Args:
        config: Mapping with ``'train_file_path'`` (path of the training CSV)
            and ``'vocab_size'`` (number of most frequent tokens to keep).

    Returns:
        A set with at most ``config['vocab_size']`` tokens.
    """
    import csv  # local import: only this function needs it

    # newline='' lets the csv module handle line endings inside quoted fields.
    with open(config['train_file_path'], 'r', encoding='utf8', newline='') as f:
        rows = [row for row in csv.reader(f) if row]

    # Without a recognisable header, fall back to "text is the last column".
    sent_col = -1
    if rows and 'sentence' in rows[0]:
        sent_col = rows[0].index('sentence')
        rows = rows[1:]  # the header must not be counted as a title

    token_counter = Counter()
    for row in tqdm(rows, desc='Counting tokens...', total=len(rows)):
        # Short rows (fewer fields than the header) fall back to their last field.
        sent = (row[sent_col] if sent_col < len(row) else row[-1]).strip()
        token_counter.update(jieba.cut(sent))

    return {token for token, _ in token_counter.most_common(config['vocab_size'])}

In [3]:
# Build the vocabulary from the training file, then display it.
# NOTE(review): the bare `vocab` expression renders the whole set; `len(vocab)` would keep the output short.
vocab = get_vocab(config)
vocab

Counting tokens...:   0%|                                         | 0/53361 [00:00<?, ?it/s]Building prefix dict from the default dictionary ...
Dumping model to file cache /var/folders/19/dgxwsbgd76728hx577833nx00000gn/T/jieba.cache
Loading model cost 0.729 seconds.
Prefix dict has been built successfully.
Counting tokens...: 100%|███████████████████████████| 53361/53361 [00:06<00:00, 7934.29it/s]


{'金庸',
 '险',
 '个股',
 '们',
 '支队',
 '这座',
 '可达',
 '余年',
 '驾考',
 '旅游',
 '大好',
 'Apple',
 '全方位',
 '向往',
 '功勋',
 '范冰冰',
 '自拍',
 '论坛',
 '莫斯科',
 '上单',
 '郜林',
 '4.0',
 '涨停',
 '追',
 '忽而',
 '地块',
 '曝出',
 '在京举行',
 '主持',
 '曾经',
 '反对派',
 '厂长',
 '犹太人',
 '排名',
 '猪价',
 '许多',
 '貂蝉',
 '造假',
 '全城',
 '加强',
 '活动',
 '禁令',
 '读懂',
 '却说',
 '桑葚',
 '户外',
 '二维码',
 '印',
 '挽回',
 '扬州',
 'OMG',
 '声明',
 '280',
 '非法',
 '失踪',
 '神剧',
 '灾区',
 '人民日报',
 '维权',
 '旅行',
 '必须',
 '上山',
 '真题',
 '居然',
 '拍卖',
 '就够',
 '岳母',
 '手榴弹',
 '吸引',
 '毛',
 '苹果',
 '升',
 '不动产',
 '河南',
 '算是',
 '强大',
 '四川省',
 '科目',
 '孔',
 '居民',
 '续航',
 ' ',
 '现在',
 '六亲',
 '网购',
 '内蒙古',
 '地标',
 '史',
 '地点',
 '吸金',
 '舆论',
 '挑战者',
 '变动',
 '卡车',
 '碎',
 '校长',
 '全能',
 '想到',
 '雪域',
 '开战',
 '可怜',
 '卡',
 '故乡',
 '700',
 '主裁',
 '德云色',
 '廉价',
 '临时',
 '国安',
 '国乒',
 '列车',
 '挖出',
 '骂',
 '封号',
 '早上',
 '超过',
 '陈奕迅',
 '供',
 '方面',
 '外媒',
 '如何',
 '居',
 '行人',
 '投篮',
 '天文',
 '运动会',
 '禁赛',
 '老板',
 '下令',
 '拿下',
 '获得',
 '搭载',
 '形态',
 '干预',
 '抱怨',
 '帮助',
 '小时候',
 '我们',
 '泪目',
 '宣布',
 '长码',
 

## 获得词向量

In [4]:
import bz2

# Decompress the pretrained embedding file and read every line into memory
# as raw bytes so the next cell can inspect the file layout.
# NOTE(review): the next cell only looks at the first four lines, and get_embedding reads the file again.
with bz2.open('../../../pt/sgns_weibo/sgns.weibo.word.bz2') as f:
    token_vector = f.readlines()    

In [5]:
# Peek at the file layout: the header line (vocabulary size and vector
# dimension) followed by the first three entries, each followed by a blank line.
for i, line in enumerate(token_vector[:4]):
    line_split = line.split()
    if i:
        print(f"词汇:{line_split[0].decode('utf8')}\n特征:{line_split[1:]}")
    else:
        print(f'词汇规模:{int(line_split[0])}, 特征维度:{int(line_split[1])}')
    print()

词汇规模:195202, 特征维度:300

词汇:，
特征:[b'0.094386', b'-0.200944', b'-0.030828', b'0.277130', b'-0.074674', b'0.239691', b'0.345185', b'0.298053', b'-0.026679', b'-0.077352', b'0.245854', b'-0.075995', b'0.058849', b'-0.176755', b'-0.072721', b'-0.246469', b'-0.182233', b'0.267472', b'0.109897', b'-0.266215', b'0.176660', b'-0.101581', b'0.374443', b'0.304319', b'0.024169', b'-0.158494', b'-0.254765', b'-0.265324', b'0.225498', b'-0.126215', b'-0.207172', b'-0.334429', b'-0.003584', b'-0.065530', b'0.174206', b'-0.097252', b'0.114595', b'-0.158193', b'-0.099948', b'-0.145332', b'-0.076565', b'-0.119460', b'0.074718', b'-0.056694', b'0.394867', b'-0.127122', b'0.270542', b'0.087482', b'-0.114715', b'0.124381', b'-0.149974', b'0.192933', b'0.131023', b'0.099271', b'-0.062209', b'0.079382', b'0.000578', b'-0.166215', b'0.155815', b'-0.279675', b'-0.184237', b'0.123209', b'0.043216', b'-0.308681', b'0.036135', b'0.064121', b'0.037674', b'0.026703', b'0.307341', b'0.089780', b'-0.057681', b'-0.2523

In [6]:
def get_embedding(vocab, embedding_path='../../../pt/sgns_weibo/sgns.weibo.word.bz2'):
    """Load pretrained vectors for the vocabulary and build the id mapping.

    The bz2 file is streamed line by line. Its first line holds the number of
    tokens and the vector size; every following line is ``token v1 v2 ...``.
    Only tokens present in ``vocab`` are kept. Ids 0-3 are reserved for
    ``<pad>``, ``<unk>``, ``<bos>`` and ``<eos>``: pad and unk get zero
    vectors, bos and eos get vectors drawn with ``np.random.random``.
    Vocabulary tokens receive ids from 4 upwards in file order.

    Args:
        vocab: Container of tokens to keep (membership is tested with ``in``).
        embedding_path: Path of the bz2-compressed embedding text file.

    Returns:
        A tuple ``(emb_mat, token2id, vocab_size)`` where ``emb_mat`` is a
        float tensor with one row per id, ``token2id`` maps token to id and
        ``vocab_size`` is the number of rows of ``emb_mat``. Tokens of
        ``vocab`` that are missing from the embedding file get no id, so
        ``vocab_size`` can be smaller than ``len(vocab) + 4``.
    """
    PAD, UNK, BOS, EOS = '<pad>', '<unk>', '<bos>', '<eos>'

    token2embedding = {}
    with bz2.open(embedding_path) as f:
        meta_info = f.readline().split()
        num_tokens, emb_size = int(meta_info[0]), int(meta_info[1])
        print(f'{num_tokens} tokens in embedding file in total, vector size is {emb_size}')

        for line in tqdm(f, total=num_tokens):
            fields = line.split()
            # Skip blank lines and entries whose vector length is wrong;
            # they would make the embedding matrix ragged.
            if len(fields) != emb_size + 1:
                continue
            token = fields[0].decode('utf8')
            if token in vocab:
                token2embedding[token] = [float(num) for num in fields[1:]]

    # Ids 0-3 are reserved for the special tokens, so real tokens start at 4.
    token2id = {token: idx for idx, token in enumerate(token2embedding, 4)}
    token2id[PAD] = 0
    token2id[UNK] = 1
    token2id[BOS] = 2
    token2id[EOS] = 3

    # Row order must match the ids above: specials first, then tokens in the
    # same order that enumerate() assigned their ids.
    emb_rows = [
        [.0] * emb_size,                      # <pad>
        [.0] * emb_size,                      # <unk>
        np.random.random(emb_size).tolist(),  # <bos>
        np.random.random(emb_size).tolist(),  # <eos>
    ]
    emb_rows.extend(token2embedding.values())

    emb_mat = torch.tensor(emb_rows, dtype=torch.float)
    # Report the real number of rows rather than len(vocab) + 4.
    return emb_mat, token2id, emb_mat.shape[0]


In [7]:
# Build the embedding matrix and the token -> id map; config['vocab_size'] is
# overwritten with the vocabulary size returned by get_embedding.
emb_mat, token2id, config['vocab_size'] = get_embedding(vocab)

195202 tokens in embedding file in total, vector size is 300


100%|████████████████████████████████████████████| 195202/195202 [00:03<00:00, 60309.12it/s]


## 数据预处理并编写DataLoader

In [8]:
def tokenizer(sent, token2id):
    """Segment a sentence with jieba and convert every token to its id.

    Args:
        sent: Text to segment.
        token2id: Mapping from token to integer id.

    Returns:
        A list of ids, one per segmented token. Tokens missing from
        ``token2id`` are mapped to 1, the id get_embedding assigns to ``<unk>``.
    """
    ids = []
    for token in jieba.cut(sent):
        ids.append(token2id.get(token, 1))
    return ids

In [9]:
import pandas as pd
from collections import defaultdict

In [10]:
def read_data(config, token2id, mode='train'):
    """Read a CSV split, tokenise its sentences and prepare model inputs.

    Args:
        config: Mapping with ``'{mode}_file_path'`` and, for ``mode='train'``,
            ``'train_val_ratio'`` (fraction of rows held out for validation).
        token2id: Token -> id mapping passed on to ``tokenizer``.
        mode: ``'train'`` splits the file into train/validation parts and
            encodes the ``label`` column; any other value reads the file
            named by ``'{mode}_file_path'`` as an unlabelled test split.

    Returns:
        For ``mode='train'``:
        ``(X_train, y_train, X_val, y_val, label2id, id2label)``, where the
        ``X_*`` dicts hold a 1-D object array of id lists under
        ``'input_ids'`` and the ``y_*`` are long tensors of label ids.
        Otherwise ``(X_test, y_test)``, where ``y_test`` is an all-zero
        placeholder tensor with one entry per row.
    """
    LABEL, SENTENCE = 'label', 'sentence'
    data_df = pd.read_csv(config[f'{mode}_file_path'], sep=',')

    # Tokenise each sentence exactly once.
    token_ids = [tokenizer(sent, token2id) for sent in data_df[SENTENCE]]

    # Sentences have different lengths. Filling a 1-D object array keeps one
    # Python list per cell; np.array() on ragged lists warns on older NumPy
    # and raises on recent versions.
    sentence_wids = np.empty(len(token_ids), dtype=object)
    for row, ids_for_row in enumerate(token_ids):
        sentence_wids[row] = ids_for_row

    if mode == 'train':
        labels = data_df[LABEL].values
        num_val = int(config['train_val_ratio'] * len(data_df))

        # Shuffle the row indices; the first num_val go to validation.
        ids = np.random.choice(range(len(data_df)), size=len(data_df), replace=False)
        val_ids, train_ids = ids[:num_val], ids[num_val:]

        X_train, X_val = defaultdict(list), defaultdict(list)
        X_train['input_ids'], y_train = sentence_wids[train_ids], labels[train_ids]
        X_val['input_ids'], y_val = sentence_wids[val_ids], labels[val_ids]

        # Build the label map from every label in the file so a class that
        # only lands in the validation split cannot raise KeyError below.
        label2id = {label: i for i, label in enumerate(np.unique(labels))}
        id2label = {i: label for label, i in label2id.items()}
        y_train = torch.tensor([label2id[y] for y in y_train], dtype=torch.long)
        y_val = torch.tensor([label2id[y] for y in y_val], dtype=torch.long)

        return X_train, y_train, X_val, y_val, label2id, id2label

    X_test = defaultdict(list)
    X_test['input_ids'] = sentence_wids
    # No labels are read for this split; zeros keep the dataset interface uniform.
    y_test = torch.zeros(len(data_df), dtype=torch.long)

    return X_test, y_test

In [11]:
# X_train, y_train, X_val, y_val, label2id, id2label = read_data(config, token2id, mode='train')

In [12]:
# X_test, y_test = read_data(config, token2id, mode='test')

#### Dataset提供数据集的封装，创建/继承Dataset必须实现:
+ `__len__`: 整个数据集的长度
+ `__getitem__`: 支持数据集索引的函数

In [13]:
from torch.utils.data import Dataset

class TNEWSDataset(Dataset):
    """Map-style dataset pairing tokenised sentences with their labels.

    ``X`` is a mapping whose ``'input_ids'`` entry is indexable by example
    number; ``y`` holds one label per example and must expose ``size(0)``.
    """

    def __init__(self, X, y):
        self.x, self.y = X, y

    def __len__(self):
        # The number of examples is the length of the label container.
        return self.y.size(0)

    def __getitem__(self, idx):
        # One example: its token ids and its label.
        input_ids = self.x['input_ids'][idx]
        label = self.y[idx]
        return {'input_ids': input_ids, 'label': label}

#### 使用DataLoader实现数据集的并行加载
+ DataLoader提供一个可迭代对象，实现数据并行加载，从TNEWSDataset返回一个example，取多次，最后形成一个长度为batch_size的列表examples
+ examples的格式：[dict1, dict2, ...]
+ collate_fn()将examples中的数据合并为Tensor

In [14]:
def collate_fn(examples):
    """Merge a list of examples into one zero-padded batch.

    Args:
        examples: List of dicts, each with ``'input_ids'`` (a sequence of
            token ids) and ``'label'``.

    Returns:
        A dict with ``'input_ids'``, a long tensor of shape
        ``(len(examples), longest sequence)`` right-padded with 0, and
        ``'label'``, a long tensor built from the labels.
    """
    sequences = [example['input_ids'] for example in examples]
    targets = [example['label'] for example in examples]

    # Every row is padded up to the longest sequence of this batch.
    longest = max(map(len, sequences))
    padded = torch.zeros((len(targets), longest), dtype=torch.long)
    for row, sequence in enumerate(sequences):
        padded[row, :len(sequence)] = torch.tensor(sequence, dtype=torch.long)

    return {
        'input_ids': padded,
        'label': torch.tensor(targets, dtype=torch.long)
    }

In [15]:
from torch.utils.data import DataLoader

def build_dataloader(config, vocab, token_to_id=None):
    """Create the train, validation and test DataLoaders.

    Args:
        config: Settings mapping; ``'batch_size'`` is read here and the whole
            mapping is passed on to ``read_data``.
        vocab: Unused; kept so existing calls keep working.
        token_to_id: Optional token -> id mapping used for tokenisation. When
            omitted, the notebook-level ``token2id`` is used, as before.

    Returns:
        ``(id2label, train_dataloader, val_dataloader, test_dataloader)``.
        Only the training loader shuffles its examples.
    """
    # An explicit mapping wins; otherwise fall back to the notebook global.
    mapping = token2id if token_to_id is None else token_to_id

    X_train, y_train, X_val, y_val, label2id, id2label = read_data(config, mapping, mode='train')
    X_test, y_test = read_data(config, mapping, mode='test')

    def make_loader(X, y, shuffle):
        # The three loaders share every setting except the data and shuffling.
        return DataLoader(dataset=TNEWSDataset(X, y), batch_size=config['batch_size'],
                          num_workers=0, shuffle=shuffle, collate_fn=collate_fn)

    train_dataloader = make_loader(X_train, y_train, shuffle=True)
    val_dataloader = make_loader(X_val, y_val, shuffle=False)
    test_dataloader = make_loader(X_test, y_test, shuffle=False)

    return id2label, train_dataloader, val_dataloader, test_dataloader

In [16]:
# Read both CSV files and wrap them in DataLoaders; id2label maps class ids back to the original labels.
id2label, train_dataloader, val_dataloader, test_dataloader = build_dataloader(config, vocab)

  import sys


In [17]:
# Sanity check: take the first training batch only, print how many rows it
# holds and then the collated batch itself.
for batch in train_dataloader:
    print(len(batch['input_ids']))
    print(batch)
    break

32
{'input_ids': tensor([[ 368,  749,  323,  624,   48,    1, 5674, 1957,  892, 3675,    0,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0],
        [8462,    1,  739,   34,   18,    1,   22,   56, 1411,   38,    8,    7,
           33,    1, 1411,  670,  260,   15,    1,    1,    7],
        [9009,    1,    1, 2188,    4,    1,    1,    1, 2998,    1,    0,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0],
        [5197,    1,    1, 5840,    0,    0,    0,    0,    0,    0,    0,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0],
        [ 340, 4981, 7492,  846,   17,    0,    0,    0,    0,    0,    0,    0,
            0,    0,    0,    0,    0,    0,    0,    0,    0],
        [   1,  492, 4721,   46,    1,    4,    1,  314,    1,  153,   12, 3680,
            5,  143,    0,    0,    0,    0,    0,    0,    0],
        [  15,  879,   41,    1,   32,  563,    4,    1,    1,    1, 1034,    8,
          114,   17,    0,    0,

## 实现TextCNN并训练验证

In [18]:
# Hyper-parameters consumed by the Model class defined below.
model_config = {
    'embedding_pretrained' : emb_mat,  # pretrained embedding matrix returned by get_embedding
    'num_filters' : 256,  # output channels of each convolution
    'emb_size' : emb_mat.shape[1],  # embedding dimension (number of columns of emb_mat)
    'dropout' : 0.3,  # dropout probability applied before the final linear layer
    'filter_sizes' : [2,3,5],  # convolution window heights, in tokens
    'num_classes' : len(id2label)  # one output logit per label in id2label
}

In [19]:
# Display the dtype of the embedding matrix (get_embedding builds it with dtype=torch.float).
emb_mat.dtype

torch.float32

In [20]:
import torch.nn.functional as F

class Model(nn.Module):
    """TextCNN classifier on top of frozen pretrained embeddings.

    One convolution per entry of ``config['filter_sizes']`` slides over the
    embedded tokens. Each feature map is max-pooled over time, the pooled
    features are concatenated, passed through dropout and projected to
    ``config['num_classes']`` logits.

    Expected ``config`` keys: ``'embedding_pretrained'``, ``'num_filters'``,
    ``'emb_size'``, ``'dropout'``, ``'filter_sizes'``, ``'num_classes'``.
    """

    def __init__(self, config):
        super(Model, self).__init__()

        self.embedding = nn.Embedding.from_pretrained(config['embedding_pretrained'], freeze=True)
        # Each kernel spans k tokens and the full embedding width.
        self.convs = nn.ModuleList([nn.Conv2d(1, config['num_filters'], (k, config['emb_size'])) for k in config['filter_sizes']])
        self.dropout = nn.Dropout(config['dropout'])

        self.fc = nn.Linear(len(config['filter_sizes']) * config['num_filters'], config['num_classes'])

    def convs_and_pool(self, x, conv):
        """Apply one convolution, ReLU, then max-pool over the sequence axis.

        ``x`` is ``[batch_size, 1, seq_len, embedding_dim]``; the result is
        ``[batch_size, out_channels]``.
        """
        # conv(x): [batch_size, out_channels, seq_len_out, 1]
        # after squeeze(3): [batch_size, out_channels, seq_len_out]
        x = F.relu(conv(x)).squeeze(3)

        # after pooling: [batch_size, out_channels, 1]
        # after squeeze(2): [batch_size, out_channels]
        x = F.max_pool1d(x, x.size(2)).squeeze(2)

        return x

    def forward(self, input_ids=None, label=None):
        """Compute logits and, when ``label`` is given, the cross-entropy loss.

        Args:
            input_ids: Long tensor ``[batch_size, seq_len]`` of token ids.
            label: Optional long tensor ``[batch_size]`` of class ids.

        Returns:
            ``(logits,)`` when ``label`` is None, otherwise ``(loss, logits)``.
        """
        # A convolution cannot run on a sequence shorter than its kernel.
        # Right-pad short batches with id 0, the padding id collate_fn uses.
        min_len = max((conv.kernel_size[0] for conv in self.convs), default=0)
        if input_ids.size(1) < min_len:
            filler = input_ids.new_zeros((input_ids.size(0), min_len - input_ids.size(1)))
            input_ids = torch.cat([input_ids, filler], dim=1)

        # out [batch_size, seq_len, embedding_dim]
        out = self.embedding(input_ids)

        # out [batch_size, 1, seq_len, embedding_dim]
        out = out.unsqueeze(1)

        # out [batch_size, len(filter_sizes) * num_filters]
        out = torch.cat([self.convs_and_pool(out, conv) for conv in self.convs], 1)

        out = self.dropout(out)
        out = self.fc(out)
        output = (out, )

        if label is not None:  # training / validation: prepend the loss
            loss_fct = nn.CrossEntropyLoss()
            loss = loss_fct(out, label)
            output = (loss,) + output

        return output

In [21]:
# Instantiate the TextCNN with the hyper-parameters defined above.
model = Model(model_config)

In [22]:
from sklearn.metrics import f1_score, precision_score, recall_score, accuracy_score

def evaluation(config, model, val_dataloader):
    """Evaluate the model on a validation loader.

    Args:
        config: Settings mapping; ``'device'`` is where batches are moved to.
        model: Callable returning ``(loss, logits, ...)`` when given the
            batch as keyword arguments; switched to eval mode here.
        val_dataloader: Sized iterable of batches (dicts of tensors that
            include a ``'label'`` entry).

    Returns:
        ``(avg_val_loss, f1, precision, recall, accuracy)`` where the loss is
        averaged over batches and f1/precision/recall are macro-averaged.
    """
    model.eval()
    target_device = config['device']
    gold_batches, pred_batches = [], []
    loss_sum = 0.

    with torch.no_grad():
        for batch in tqdm(val_dataloader, desc='Evaluation...', total=len(val_dataloader)):
            # Gold labels are collected before the batch is moved to the device.
            gold_batches.append(batch['label'])

            on_device = {}
            for name, tensor in batch.items():
                on_device[name] = tensor.to(target_device)

            # With a label in the batch the model output starts with (loss, logits).
            loss, logits = model(**on_device)[:2]
            loss_sum += loss.item()

            pred_batches.append(logits.argmax(dim=-1).detach().cpu())

    mean_loss = loss_sum / len(val_dataloader)
    y_true = torch.cat(gold_batches, dim=0).numpy()
    y_pred = torch.cat(pred_batches, dim=0).numpy()

    f1 = f1_score(y_true, y_pred, average='macro')
    precision = precision_score(y_true, y_pred, average='macro')
    recall = recall_score(y_true, y_pred, average='macro')
    accuracy = accuracy_score(y_true, y_pred)

    return mean_loss, f1, precision, recall, accuracy

In [27]:
import pickle
from torch.optim import AdamW
from tqdm import trange

def train(model, config, id2label, train_dataloader, val_dataloader,
          save_path='../../../pt_tmp/cls/textcnn_base_chinese/pytorch_model.pkl'):
    """Train the model and checkpoint it whenever the validation F1 improves.

    Every ``config['logging_step']`` optimizer steps the model is evaluated on
    ``val_dataloader``. When the macro F1 beats the best value so far, the
    metrics are printed and the whole model object is pickled to ``save_path``.

    Args:
        model: Module whose forward returns ``(loss, ...)`` for a batch that
            contains labels.
        config: Settings mapping; reads ``'learning_rate'``, ``'device'``,
            ``'num_epochs'`` and ``'logging_step'``.
        id2label: Unused; kept so existing calls keep working.
        train_dataloader: Sized iterable of training batches (dicts of tensors).
        val_dataloader: Loader passed to ``evaluation``.
        save_path: Where the best model is pickled. Missing parent
            directories are created.

    Returns:
        ``(best_f1, best_precision, best_recall, best_accuracy)`` of the best
        evaluation, or zeros if no evaluation improved on 0.
    """
    import os  # local import: only needed to create the checkpoint directory

    optimizer = AdamW(model.parameters(), lr=config['learning_rate'])
    model.to(config['device'])

    # global_step counts optimizer steps across all epochs.
    global_step = 0
    # Running sum of batch losses since the last evaluation, kept as a float.
    train_loss = 0.

    best_f1 = 0.
    best_precision = 0.
    best_recall = 0.
    best_accuracy = 0.

    for epoch in trange(config['num_epochs']):
        model.train()
        for batch in tqdm(train_dataloader, desc='Training', total=len(train_dataloader)):
            batch = {item: value.to(config['device']) for item, value in batch.items()}

            # With labels in the batch the first output is the loss.
            loss = model(**batch)[0]

            model.zero_grad()
            loss.backward()
            optimizer.step()
            # .item() stores a plain float, so no autograd tensor is kept
            # alive between evaluations.
            train_loss += loss.item()
            global_step += 1

            if global_step % config['logging_step'] == 0:
                print_train_loss = train_loss / config['logging_step']
                train_loss = 0.
                avg_val_loss, f1, precision, recall, accuracy = evaluation(config, model, val_dataloader)

                if best_f1 < f1:
                    best_f1 = f1
                    best_precision = precision
                    best_recall = recall
                    best_accuracy = accuracy
                    print_log = f'''>>> training loss: {print_train_loss: .4f}, valid loss: {avg_val_loss: .4f}\n
                            valid f1 score: {f1: .4f}, valid precision score: {precision: .4f},
                            valid recall score: {recall: .4f}, valid accuracy score: {accuracy: .4f}'''
                    print(print_log)

                    save_dir = os.path.dirname(save_path)
                    if save_dir:
                        os.makedirs(save_dir, exist_ok=True)
                    # NOTE(review): this pickles the whole module object.
                    # Unpickling runs arbitrary code, so only load checkpoints
                    # you produced yourself. The format is kept unchanged for
                    # existing loaders.
                    with open(save_path, 'wb') as f:
                        pickle.dump(model, f)

                # evaluation() switched the model to eval mode; switch back.
                model.train()

    return best_f1, best_precision, best_recall, best_accuracy

In [28]:
# Run the full training loop, then report the best validation metrics it returns.
f1, precision, recall, accuracy = train(model, config, id2label, train_dataloader, val_dataloader)
print_log = f'''valid f1 score: {f1: .4f}, valid precision score: {precision: .4f},
                valid recall score: {recall: .4f}, valid accuracy score: {accuracy: .4f}'''
print(print_log)

  0%|                                                                | 0/10 [00:00<?, ?it/s]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:57, 12.71it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:41, 14.76it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:39, 15.05it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:37, 15.37it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:36, 15.51it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:37, 15.31it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:40, 14.84it/s][A
Training:   1%|▍                                          | 16/1501 [00:01<01:40, 14.79it/s][A
Training:   1%|▌                           

Training:  11%|████▋                                     | 168/1501 [00:10<01:21, 16.39it/s][A
Training:  11%|████▊                                     | 170/1501 [00:10<01:21, 16.26it/s][A
Training:  11%|████▊                                     | 172/1501 [00:10<01:18, 16.88it/s][A
Training:  12%|████▊                                     | 174/1501 [00:10<01:20, 16.51it/s][A
Training:  12%|████▉                                     | 176/1501 [00:10<01:19, 16.75it/s][A
Training:  12%|████▉                                     | 178/1501 [00:10<01:18, 16.93it/s][A
Training:  12%|█████                                     | 180/1501 [00:10<01:19, 16.69it/s][A
Training:  12%|█████                                     | 182/1501 [00:11<01:17, 16.92it/s][A
Training:  12%|█████▏                                    | 184/1501 [00:11<01:15, 17.42it/s][A
Training:  12%|█████▏                                    | 186/1501 [00:11<01:19, 16.63it/s][A
Training:  13%|█████▎                   

Evaluation...:  45%|█████████████████▌                     | 75/167 [00:02<00:02, 37.88it/s][A[A

Evaluation...:  47%|██████████████████▍                    | 79/167 [00:02<00:02, 38.28it/s][A[A

Evaluation...:  50%|███████████████████▍                   | 83/167 [00:02<00:02, 38.60it/s][A[A

Evaluation...:  52%|████████████████████▎                  | 87/167 [00:02<00:02, 36.75it/s][A[A

Evaluation...:  54%|█████████████████████▎                 | 91/167 [00:02<00:02, 36.22it/s][A[A

Evaluation...:  57%|██████████████████████▏                | 95/167 [00:02<00:02, 35.92it/s][A[A

Evaluation...:  59%|███████████████████████                | 99/167 [00:02<00:01, 36.00it/s][A[A

Evaluation...:  62%|███████████████████████▍              | 103/167 [00:02<00:01, 36.76it/s][A[A

Evaluation...:  64%|████████████████████████▎             | 107/167 [00:02<00:01, 37.40it/s][A[A

Evaluation...:  67%|█████████████████████████▍            | 112/167 [00:03<00:01, 38.90it/s][A[A



>>> training loss:  1.4154, valid loss:  1.4659

                            valid f1 score:  0.4721, valid precision score:  0.5316,
                            valid recall score:  0.4596, valid accuracy score:  0.5208



Training:  20%|████████▌                                 | 304/1501 [00:23<07:52,  2.53it/s][A
Training:  20%|████████▌                                 | 306/1501 [00:24<05:49,  3.42it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:24<04:25,  4.49it/s][A
Training:  21%|████████▋                                 | 310/1501 [00:24<03:27,  5.73it/s][A
Training:  21%|████████▋                                 | 312/1501 [00:24<02:46,  7.12it/s][A
Training:  21%|████████▊                                 | 314/1501 [00:24<02:15,  8.73it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:24<02:00,  9.84it/s][A
Training:  21%|████████▉                                 | 318/1501 [00:24<01:44, 11.33it/s][A
Training:  21%|████████▉                                 | 320/1501 [00:24<01:32, 12.72it/s][A
Training:  21%|█████████                                 | 322/1501 [00:24<01:24, 13.97it/s][A
Training:  22%|█████████               

Training:  32%|█████████████▎                            | 475/1501 [00:34<01:05, 15.66it/s][A
Training:  32%|█████████████▎                            | 477/1501 [00:34<01:02, 16.37it/s][A
Training:  32%|█████████████▍                            | 479/1501 [00:34<01:04, 15.92it/s][A
Training:  32%|█████████████▍                            | 481/1501 [00:34<01:04, 15.85it/s][A
Training:  32%|█████████████▌                            | 483/1501 [00:34<01:03, 15.93it/s][A
Training:  32%|█████████████▌                            | 485/1501 [00:34<01:01, 16.48it/s][A
Training:  32%|█████████████▋                            | 487/1501 [00:35<01:00, 16.68it/s][A
Training:  33%|█████████████▋                            | 489/1501 [00:35<01:00, 16.65it/s][A
Training:  33%|█████████████▋                            | 491/1501 [00:35<01:00, 16.65it/s][A
Training:  33%|█████████████▊                            | 493/1501 [00:35<01:00, 16.55it/s][A
Training:  33%|█████████████▊           

Evaluation...:  55%|█████████████████████▍                 | 92/167 [00:02<00:02, 37.40it/s][A[A

Evaluation...:  57%|██████████████████████▍                | 96/167 [00:02<00:01, 35.65it/s][A[A

Evaluation...:  60%|██████████████████████▊               | 100/167 [00:02<00:02, 33.26it/s][A[A

Evaluation...:  62%|███████████████████████▋              | 104/167 [00:02<00:01, 32.13it/s][A[A

Evaluation...:  65%|████████████████████████▌             | 108/167 [00:02<00:01, 31.81it/s][A[A

Evaluation...:  67%|█████████████████████████▍            | 112/167 [00:03<00:01, 32.84it/s][A[A

Evaluation...:  69%|██████████████████████████▍           | 116/167 [00:03<00:01, 34.36it/s][A[A

Evaluation...:  72%|███████████████████████████▎          | 120/167 [00:03<00:01, 34.63it/s][A[A

Evaluation...:  75%|████████████████████████████▍         | 125/167 [00:03<00:01, 37.18it/s][A[A

Evaluation...:  78%|█████████████████████████████▌        | 130/167 [00:03<00:00, 38.57it/s][A[A



>>> training loss:  1.4203, valid loss:  1.4690

                            valid f1 score:  0.4929, valid precision score:  0.5664,
                            valid recall score:  0.4792, valid accuracy score:  0.5204



Training:  40%|████████████████▉                         | 604/1501 [00:46<06:09,  2.43it/s][A
Training:  40%|████████████████▉                         | 606/1501 [00:46<04:34,  3.26it/s][A
Training:  41%|█████████████████                         | 608/1501 [00:47<03:27,  4.31it/s][A
Training:  41%|█████████████████                         | 610/1501 [00:47<02:41,  5.51it/s][A
Training:  41%|█████████████████                         | 612/1501 [00:47<02:10,  6.81it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [00:47<01:49,  8.12it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [00:47<01:34,  9.38it/s][A
Training:  41%|█████████████████▎                        | 618/1501 [00:47<01:22, 10.68it/s][A
Training:  41%|█████████████████▎                        | 620/1501 [00:47<01:16, 11.45it/s][A
Training:  41%|█████████████████▍                        | 622/1501 [00:48<01:11, 12.38it/s][A
Training:  42%|█████████████████▍      

Training:  52%|█████████████████████▋                    | 774/1501 [00:57<00:44, 16.22it/s][A
Training:  52%|█████████████████████▋                    | 776/1501 [00:57<00:43, 16.86it/s][A
Training:  52%|█████████████████████▊                    | 778/1501 [00:57<00:43, 16.72it/s][A
Training:  52%|█████████████████████▊                    | 780/1501 [00:58<00:43, 16.58it/s][A
Training:  52%|█████████████████████▉                    | 782/1501 [00:58<00:43, 16.53it/s][A
Training:  52%|█████████████████████▉                    | 784/1501 [00:58<00:42, 17.01it/s][A
Training:  52%|█████████████████████▉                    | 786/1501 [00:58<00:41, 17.30it/s][A
Training:  52%|██████████████████████                    | 788/1501 [00:58<00:40, 17.76it/s][A
Training:  53%|██████████████████████                    | 790/1501 [00:58<00:40, 17.67it/s][A
Training:  53%|██████████████████████▏                   | 792/1501 [00:58<00:42, 16.75it/s][A
Training:  53%|██████████████████████▏  

Evaluation...:  50%|███████████████████▌                   | 84/167 [00:02<00:02, 35.08it/s][A[A

Evaluation...:  53%|████████████████████▌                  | 88/167 [00:02<00:02, 33.07it/s][A[A

Evaluation...:  55%|█████████████████████▍                 | 92/167 [00:02<00:02, 34.26it/s][A[A

Evaluation...:  57%|██████████████████████▍                | 96/167 [00:02<00:02, 33.54it/s][A[A

Evaluation...:  60%|██████████████████████▊               | 100/167 [00:03<00:01, 34.21it/s][A[A

Evaluation...:  62%|███████████████████████▋              | 104/167 [00:03<00:01, 34.83it/s][A[A

Evaluation...:  65%|████████████████████████▌             | 108/167 [00:03<00:01, 35.85it/s][A[A

Evaluation...:  67%|█████████████████████████▍            | 112/167 [00:03<00:01, 36.51it/s][A[A

Evaluation...:  69%|██████████████████████████▍           | 116/167 [00:03<00:01, 36.32it/s][A[A

Evaluation...:  72%|███████████████████████████▎          | 120/167 [00:03<00:01, 33.06it/s][A[A



>>> training loss:  1.4743, valid loss:  1.4406

                            valid f1 score:  0.5041, valid precision score:  0.5589,
                            valid recall score:  0.4955, valid accuracy score:  0.5232



Training:  60%|█████████████████████████▎                | 904/1501 [01:11<04:33,  2.18it/s][A
Training:  60%|█████████████████████████▎                | 906/1501 [01:11<03:24,  2.92it/s][A
Training:  60%|█████████████████████████▍                | 908/1501 [01:11<02:35,  3.82it/s][A
Training:  61%|█████████████████████████▍                | 910/1501 [01:12<01:59,  4.93it/s][A
Training:  61%|█████████████████████████▌                | 912/1501 [01:12<01:35,  6.14it/s][A
Training:  61%|█████████████████████████▌                | 914/1501 [01:12<01:18,  7.52it/s][A
Training:  61%|█████████████████████████▋                | 916/1501 [01:12<01:05,  8.99it/s][A
Training:  61%|█████████████████████████▋                | 918/1501 [01:12<00:55, 10.52it/s][A
Training:  61%|█████████████████████████▋                | 920/1501 [01:12<00:49, 11.65it/s][A
Training:  61%|█████████████████████████▊                | 922/1501 [01:12<00:44, 12.95it/s][A
Training:  62%|████████████████████████

Training:  72%|█████████████████████████████▎           | 1074/1501 [01:23<00:35, 11.86it/s][A
Training:  72%|█████████████████████████████▍           | 1076/1501 [01:23<00:35, 11.91it/s][A
Training:  72%|█████████████████████████████▍           | 1078/1501 [01:23<00:35, 12.07it/s][A
Training:  72%|█████████████████████████████▌           | 1080/1501 [01:23<00:34, 12.28it/s][A
Training:  72%|█████████████████████████████▌           | 1082/1501 [01:23<00:34, 12.22it/s][A
Training:  72%|█████████████████████████████▌           | 1084/1501 [01:23<00:32, 12.99it/s][A
Training:  72%|█████████████████████████████▋           | 1086/1501 [01:24<00:33, 12.38it/s][A
Training:  72%|█████████████████████████████▋           | 1088/1501 [01:24<00:35, 11.68it/s][A
Training:  73%|█████████████████████████████▊           | 1090/1501 [01:24<00:37, 10.85it/s][A
Training:  73%|█████████████████████████████▊           | 1092/1501 [01:24<00:39, 10.43it/s][A
Training:  73%|█████████████████████████

Evaluation...:  51%|███████████████████▊                   | 85/167 [00:02<00:02, 37.22it/s][A[A

Evaluation...:  53%|████████████████████▊                  | 89/167 [00:02<00:02, 34.50it/s][A[A

Evaluation...:  56%|█████████████████████▋                 | 93/167 [00:02<00:02, 35.41it/s][A[A

Evaluation...:  58%|██████████████████████▋                | 97/167 [00:02<00:02, 34.75it/s][A[A

Evaluation...:  60%|██████████████████████▉               | 101/167 [00:02<00:01, 35.84it/s][A[A

Evaluation...:  63%|███████████████████████▉              | 105/167 [00:02<00:01, 35.99it/s][A[A

Evaluation...:  66%|█████████████████████████             | 110/167 [00:03<00:01, 38.32it/s][A[A

Evaluation...:  68%|█████████████████████████▉            | 114/167 [00:03<00:01, 38.05it/s][A[A

Evaluation...:  71%|██████████████████████████▊           | 118/167 [00:03<00:01, 37.56it/s][A[A

Evaluation...:  73%|███████████████████████████▊          | 122/167 [00:03<00:01, 37.04it/s][A[A



Training:  88%|████████████████████████████████████▏    | 1326/1501 [01:45<00:12, 13.47it/s][A
Training:  88%|████████████████████████████████████▎    | 1328/1501 [01:45<00:12, 13.69it/s][A
Training:  89%|████████████████████████████████████▎    | 1330/1501 [01:45<00:12, 13.81it/s][A
Training:  89%|████████████████████████████████████▍    | 1332/1501 [01:45<00:12, 13.88it/s][A
Training:  89%|████████████████████████████████████▍    | 1334/1501 [01:45<00:11, 14.17it/s][A
Training:  89%|████████████████████████████████████▍    | 1336/1501 [01:46<00:11, 14.66it/s][A
Training:  89%|████████████████████████████████████▌    | 1338/1501 [01:46<00:10, 15.57it/s][A
Training:  89%|████████████████████████████████████▌    | 1340/1501 [01:46<00:10, 15.81it/s][A
Training:  89%|████████████████████████████████████▋    | 1342/1501 [01:46<00:10, 15.43it/s][A
Training:  90%|████████████████████████████████████▋    | 1344/1501 [01:46<00:09, 15.83it/s][A
Training:  90%|█████████████████████████

Training: 100%|████████████████████████████████████████▊| 1496/1501 [01:56<00:00, 16.14it/s][A
Training: 100%|████████████████████████████████████████▉| 1498/1501 [01:56<00:00, 16.88it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:04, 35.19it/s][A[A

Evaluation...:   5%|█▉                                      | 8/167 [00:00<00:04, 35.35it/s][A[A

Evaluation...:   7%|██▊                                    | 12/167 [00:00<00:04, 36.81it/s][A[A

Evaluation...:  10%|███▉                                   | 17/167 [00:00<00:03, 38.77it/s][A[A

Evaluation...:  13%|████▉                                  | 21/167 [00:00<00:03, 38.63it/s][A[A

Evaluation...:  15%|█████▊                                 | 25/167 [00:00<00:03, 38.44it/s][A[A

Evaluation...:  17%|██████▊                                | 29/167 [00:00<00:03, 37.66it/s][A[A

Evaluat

Training:   5%|██▏                                        | 76/1501 [00:04<01:21, 17.44it/s][A
Training:   5%|██▏                                        | 78/1501 [00:04<01:22, 17.28it/s][A
Training:   5%|██▎                                        | 80/1501 [00:04<01:23, 17.01it/s][A
Training:   5%|██▎                                        | 82/1501 [00:04<01:23, 17.08it/s][A
Training:   6%|██▍                                        | 84/1501 [00:04<01:26, 16.40it/s][A
Training:   6%|██▍                                        | 86/1501 [00:05<01:22, 17.19it/s][A
Training:   6%|██▌                                        | 88/1501 [00:05<01:21, 17.44it/s][A
Training:   6%|██▌                                        | 90/1501 [00:05<01:18, 17.96it/s][A
Training:   6%|██▋                                        | 92/1501 [00:05<01:21, 17.23it/s][A
Training:   6%|██▋                                        | 94/1501 [00:05<01:20, 17.55it/s][A
Training:   6%|██▊                      

Training:  16%|██████▉                                   | 247/1501 [00:14<01:15, 16.65it/s][A
Training:  17%|██████▉                                   | 249/1501 [00:14<01:14, 16.72it/s][A
Training:  17%|███████                                   | 251/1501 [00:14<01:14, 16.78it/s][A
Training:  17%|███████                                   | 253/1501 [00:14<01:11, 17.39it/s][A
Training:  17%|███████▏                                  | 255/1501 [00:14<01:13, 16.92it/s][A
Training:  17%|███████▏                                  | 257/1501 [00:15<01:13, 16.92it/s][A
Training:  17%|███████▏                                  | 259/1501 [00:15<01:12, 17.17it/s][A
Training:  17%|███████▎                                  | 261/1501 [00:15<01:12, 17.14it/s][A
Training:  18%|███████▎                                  | 263/1501 [00:15<01:11, 17.33it/s][A
Training:  18%|███████▍                                  | 265/1501 [00:15<01:13, 16.91it/s][A
Training:  18%|███████▍                 

>>> training loss:  1.2475, valid loss:  1.4462

                            valid f1 score:  0.5099, valid precision score:  0.5315,
                            valid recall score:  0.5088, valid accuracy score:  0.5255



Training:  20%|████████▍                                 | 303/1501 [00:21<07:21,  2.71it/s][A
Training:  20%|████████▌                                 | 305/1501 [00:22<05:27,  3.65it/s][A
Training:  20%|████████▌                                 | 307/1501 [00:22<04:08,  4.80it/s][A
Training:  21%|████████▋                                 | 309/1501 [00:22<03:15,  6.09it/s][A
Training:  21%|████████▋                                 | 311/1501 [00:22<02:38,  7.49it/s][A
Training:  21%|████████▊                                 | 313/1501 [00:22<02:10,  9.10it/s][A
Training:  21%|████████▊                                 | 315/1501 [00:22<01:51, 10.60it/s][A
Training:  21%|████████▊                                 | 317/1501 [00:22<01:38, 12.01it/s][A
Training:  21%|████████▉                                 | 319/1501 [00:22<01:30, 13.04it/s][A
Training:  21%|████████▉                                 | 321/1501 [00:22<01:25, 13.73it/s][A
Training:  22%|█████████               

Training:  32%|█████████████▏                            | 473/1501 [00:32<01:02, 16.43it/s][A
Training:  32%|█████████████▎                            | 475/1501 [00:32<01:01, 16.64it/s][A
Training:  32%|█████████████▎                            | 477/1501 [00:32<01:02, 16.43it/s][A
Training:  32%|█████████████▍                            | 479/1501 [00:32<01:01, 16.67it/s][A
Training:  32%|█████████████▍                            | 481/1501 [00:32<00:59, 17.12it/s][A
Training:  32%|█████████████▌                            | 483/1501 [00:32<00:59, 17.20it/s][A
Training:  32%|█████████████▌                            | 485/1501 [00:32<00:59, 17.08it/s][A
Training:  32%|█████████████▋                            | 487/1501 [00:32<00:58, 17.32it/s][A
Training:  33%|█████████████▋                            | 489/1501 [00:33<00:57, 17.54it/s][A
Training:  33%|█████████████▋                            | 491/1501 [00:33<00:57, 17.64it/s][A
Training:  33%|█████████████▊           

Evaluation...:  51%|███████████████████▊                   | 85/167 [00:02<00:02, 37.49it/s][A[A

Evaluation...:  53%|████████████████████▊                  | 89/167 [00:02<00:02, 35.17it/s][A[A

Evaluation...:  56%|█████████████████████▋                 | 93/167 [00:02<00:02, 36.00it/s][A[A

Evaluation...:  58%|██████████████████████▋                | 97/167 [00:02<00:01, 35.53it/s][A[A

Evaluation...:  60%|██████████████████████▉               | 101/167 [00:02<00:01, 36.68it/s][A[A

Evaluation...:  63%|███████████████████████▉              | 105/167 [00:02<00:01, 36.69it/s][A[A

Evaluation...:  66%|█████████████████████████             | 110/167 [00:02<00:01, 38.60it/s][A[A

Evaluation...:  68%|█████████████████████████▉            | 114/167 [00:03<00:01, 38.26it/s][A[A

Evaluation...:  71%|██████████████████████████▊           | 118/167 [00:03<00:01, 37.94it/s][A[A

Evaluation...:  73%|███████████████████████████▊          | 122/167 [00:03<00:01, 37.59it/s][A[A



Training:  48%|████████████████████▎                     | 725/1501 [00:51<00:46, 16.85it/s][A
Training:  48%|████████████████████▎                     | 727/1501 [00:51<00:45, 17.10it/s][A
Training:  49%|████████████████████▍                     | 729/1501 [00:52<00:46, 16.56it/s][A
Training:  49%|████████████████████▍                     | 731/1501 [00:52<00:46, 16.58it/s][A
Training:  49%|████████████████████▌                     | 733/1501 [00:52<00:45, 16.70it/s][A
Training:  49%|████████████████████▌                     | 735/1501 [00:52<00:45, 16.85it/s][A
Training:  49%|████████████████████▌                     | 737/1501 [00:52<00:47, 15.99it/s][A
Training:  49%|████████████████████▋                     | 739/1501 [00:52<00:47, 16.21it/s][A
Training:  49%|████████████████████▋                     | 741/1501 [00:52<00:45, 16.87it/s][A
Training:  50%|████████████████████▊                     | 743/1501 [00:52<00:46, 16.15it/s][A
Training:  50%|████████████████████▊    

Training:  60%|█████████████████████████                 | 895/1501 [01:01<00:36, 16.42it/s][A
Training:  60%|█████████████████████████                 | 897/1501 [01:01<00:35, 16.82it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:04, 36.85it/s][A[A

Evaluation...:   5%|█▉                                      | 8/167 [00:00<00:04, 36.63it/s][A[A

Evaluation...:   7%|██▊                                    | 12/167 [00:00<00:04, 37.24it/s][A[A

Evaluation...:  10%|███▉                                   | 17/167 [00:00<00:03, 38.93it/s][A[A

Evaluation...:  13%|████▉                                  | 21/167 [00:00<00:03, 36.85it/s][A[A

Evaluation...:  15%|█████▊                                 | 25/167 [00:00<00:03, 36.65it/s][A[A

Evaluation...:  17%|██████▊                                | 29/167 [00:00<00:03, 36.15it/s][A[A

Evaluat

Training:  65%|███████████████████████████▍              | 979/1501 [01:11<00:29, 17.50it/s][A
Training:  65%|███████████████████████████▍              | 981/1501 [01:11<00:30, 17.31it/s][A
Training:  65%|███████████████████████████▌              | 983/1501 [01:11<00:31, 16.32it/s][A
Training:  66%|███████████████████████████▌              | 985/1501 [01:11<00:31, 16.60it/s][A
Training:  66%|███████████████████████████▌              | 987/1501 [01:11<00:30, 16.61it/s][A
Training:  66%|███████████████████████████▋              | 989/1501 [01:11<00:31, 16.46it/s][A
Training:  66%|███████████████████████████▋              | 991/1501 [01:12<00:31, 16.22it/s][A
Training:  66%|███████████████████████████▊              | 993/1501 [01:12<00:30, 16.64it/s][A
Training:  66%|███████████████████████████▊              | 995/1501 [01:12<00:30, 16.59it/s][A
Training:  66%|███████████████████████████▉              | 997/1501 [01:12<00:30, 16.74it/s][A
Training:  67%|█████████████████████████

Training:  77%|███████████████████████████████▍         | 1149/1501 [01:21<00:21, 16.18it/s][A
Training:  77%|███████████████████████████████▍         | 1151/1501 [01:21<00:20, 16.95it/s][A
Training:  77%|███████████████████████████████▍         | 1153/1501 [01:21<00:20, 17.03it/s][A
Training:  77%|███████████████████████████████▌         | 1155/1501 [01:21<00:20, 17.03it/s][A
Training:  77%|███████████████████████████████▌         | 1157/1501 [01:21<00:19, 17.34it/s][A
Training:  77%|███████████████████████████████▋         | 1159/1501 [01:22<00:20, 17.01it/s][A
Training:  77%|███████████████████████████████▋         | 1161/1501 [01:22<00:20, 16.99it/s][A
Training:  77%|███████████████████████████████▊         | 1163/1501 [01:22<00:19, 17.25it/s][A
Training:  78%|███████████████████████████████▊         | 1165/1501 [01:22<00:19, 17.59it/s][A
Training:  78%|███████████████████████████████▉         | 1167/1501 [01:22<00:19, 17.33it/s][A
Training:  78%|█████████████████████████

Training:  82%|█████████████████████████████████▋       | 1233/1501 [01:30<00:16, 16.00it/s][A
Training:  82%|█████████████████████████████████▋       | 1235/1501 [01:30<00:16, 16.40it/s][A
Training:  82%|█████████████████████████████████▊       | 1237/1501 [01:31<00:16, 16.37it/s][A
Training:  83%|█████████████████████████████████▊       | 1239/1501 [01:31<00:16, 16.26it/s][A
Training:  83%|█████████████████████████████████▉       | 1241/1501 [01:31<00:16, 16.23it/s][A
Training:  83%|█████████████████████████████████▉       | 1243/1501 [01:31<00:15, 16.48it/s][A
Training:  83%|██████████████████████████████████       | 1245/1501 [01:31<00:15, 16.71it/s][A
Training:  83%|██████████████████████████████████       | 1247/1501 [01:31<00:14, 17.16it/s][A
Training:  83%|██████████████████████████████████       | 1249/1501 [01:31<00:14, 17.08it/s][A
Training:  83%|██████████████████████████████████▏      | 1251/1501 [01:31<00:14, 16.75it/s][A
Training:  83%|█████████████████████████

Training:  93%|██████████████████████████████████████▎  | 1403/1501 [01:40<00:05, 16.48it/s][A
Training:  94%|██████████████████████████████████████▍  | 1405/1501 [01:40<00:05, 16.73it/s][A
Training:  94%|██████████████████████████████████████▍  | 1407/1501 [01:41<00:05, 17.12it/s][A
Training:  94%|██████████████████████████████████████▍  | 1409/1501 [01:41<00:05, 17.56it/s][A
Training:  94%|██████████████████████████████████████▌  | 1411/1501 [01:41<00:05, 17.69it/s][A
Training:  94%|██████████████████████████████████████▌  | 1413/1501 [01:41<00:05, 17.36it/s][A
Training:  94%|██████████████████████████████████████▋  | 1415/1501 [01:41<00:05, 16.85it/s][A
Training:  94%|██████████████████████████████████████▋  | 1417/1501 [01:41<00:04, 17.06it/s][A
Training:  95%|██████████████████████████████████████▊  | 1419/1501 [01:41<00:04, 16.95it/s][A
Training:  95%|██████████████████████████████████████▊  | 1421/1501 [01:41<00:04, 16.89it/s][A
Training:  95%|█████████████████████████

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 36.94it/s][A[A

Evaluation...:  91%|██████████████████████████████████▌   | 152/167 [00:04<00:00, 37.42it/s][A[A

Evaluation...:  93%|███████████████████████████████████▍  | 156/167 [00:04<00:00, 33.67it/s][A[A

Evaluation...:  96%|████████████████████████████████████▍ | 160/167 [00:04<00:00, 34.21it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.36it/s][A[A

Training: 100%|█████████████████████████████████████████| 1501/1501 [01:51<00:00, 13.51it/s][A
 20%|███████████                                            | 2/10 [03:52<15:21, 115.20s/it]
Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:19, 18.83it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:19, 18.88it/s][A
Training:   0%|▏       

Training:  10%|████▎                                     | 156/1501 [00:09<01:14, 17.98it/s][A
Training:  11%|████▍                                     | 158/1501 [00:09<01:14, 17.98it/s][A
Training:  11%|████▍                                     | 160/1501 [00:09<01:17, 17.40it/s][A
Training:  11%|████▌                                     | 162/1501 [00:09<01:15, 17.63it/s][A
Training:  11%|████▌                                     | 164/1501 [00:09<01:19, 16.79it/s][A
Training:  11%|████▋                                     | 166/1501 [00:09<01:17, 17.15it/s][A
Training:  11%|████▋                                     | 168/1501 [00:09<01:16, 17.50it/s][A
Training:  11%|████▊                                     | 170/1501 [00:09<01:20, 16.58it/s][A
Training:  11%|████▊                                     | 172/1501 [00:10<01:19, 16.65it/s][A
Training:  12%|████▊                                     | 174/1501 [00:10<01:18, 16.86it/s][A
Training:  12%|████▉                    

Evaluation...:  32%|████████████▌                          | 54/167 [00:01<00:03, 37.64it/s][A[A

Evaluation...:  35%|█████████████▌                         | 58/167 [00:01<00:02, 37.66it/s][A[A

Evaluation...:  37%|██████████████▍                        | 62/167 [00:01<00:02, 38.11it/s][A[A

Evaluation...:  40%|███████████████▍                       | 66/167 [00:01<00:02, 38.66it/s][A[A

Evaluation...:  42%|████████████████▎                      | 70/167 [00:01<00:02, 37.97it/s][A[A

Evaluation...:  44%|█████████████████▎                     | 74/167 [00:01<00:02, 37.72it/s][A[A

Evaluation...:  47%|██████████████████▍                    | 79/167 [00:02<00:02, 38.83it/s][A[A

Evaluation...:  50%|███████████████████▍                   | 83/167 [00:02<00:02, 39.15it/s][A[A

Evaluation...:  52%|████████████████████▎                  | 87/167 [00:02<00:02, 37.31it/s][A[A

Evaluation...:  54%|█████████████████████▎                 | 91/167 [00:02<00:02, 36.88it/s][A[A



Training:  27%|███████████▍                              | 410/1501 [00:28<01:05, 16.55it/s][A
Training:  27%|███████████▌                              | 412/1501 [00:28<01:06, 16.41it/s][A
Training:  28%|███████████▌                              | 414/1501 [00:28<01:05, 16.51it/s][A
Training:  28%|███████████▋                              | 416/1501 [00:28<01:07, 16.19it/s][A
Training:  28%|███████████▋                              | 418/1501 [00:28<01:04, 16.72it/s][A
Training:  28%|███████████▊                              | 420/1501 [00:29<01:03, 17.08it/s][A
Training:  28%|███████████▊                              | 422/1501 [00:29<01:02, 17.37it/s][A
Training:  28%|███████████▊                              | 424/1501 [00:29<01:01, 17.57it/s][A
Training:  28%|███████████▉                              | 426/1501 [00:29<01:00, 17.71it/s][A
Training:  29%|███████████▉                              | 428/1501 [00:29<00:59, 17.94it/s][A
Training:  29%|████████████             

Training:  39%|████████████████▏                         | 580/1501 [00:38<00:52, 17.46it/s][A
Training:  39%|████████████████▎                         | 582/1501 [00:38<00:52, 17.46it/s][A
Training:  39%|████████████████▎                         | 584/1501 [00:38<00:54, 16.80it/s][A
Training:  39%|████████████████▍                         | 586/1501 [00:38<00:55, 16.36it/s][A
Training:  39%|████████████████▍                         | 588/1501 [00:39<00:56, 16.24it/s][A
Training:  39%|████████████████▌                         | 590/1501 [00:39<00:55, 16.55it/s][A
Training:  39%|████████████████▌                         | 592/1501 [00:39<00:58, 15.61it/s][A
Training:  40%|████████████████▌                         | 594/1501 [00:39<00:56, 15.98it/s][A
Training:  40%|████████████████▋                         | 596/1501 [00:39<00:54, 16.75it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉              

Training:  44%|██████████████████▋                       | 666/1501 [00:48<00:51, 16.19it/s][A
Training:  45%|██████████████████▋                       | 668/1501 [00:48<00:51, 16.24it/s][A
Training:  45%|██████████████████▋                       | 670/1501 [00:48<00:49, 16.68it/s][A
Training:  45%|██████████████████▊                       | 672/1501 [00:48<00:50, 16.58it/s][A
Training:  45%|██████████████████▊                       | 674/1501 [00:48<00:49, 16.79it/s][A
Training:  45%|██████████████████▉                       | 676/1501 [00:48<00:49, 16.59it/s][A
Training:  45%|██████████████████▉                       | 678/1501 [00:48<00:49, 16.69it/s][A
Training:  45%|███████████████████                       | 680/1501 [00:49<00:50, 16.10it/s][A
Training:  45%|███████████████████                       | 682/1501 [00:49<00:48, 17.01it/s][A
Training:  46%|███████████████████▏                      | 684/1501 [00:49<00:48, 16.92it/s][A
Training:  46%|███████████████████▏     

Training:  56%|███████████████████████▍                  | 836/1501 [00:58<00:39, 16.77it/s][A
Training:  56%|███████████████████████▍                  | 838/1501 [00:58<00:39, 16.84it/s][A
Training:  56%|███████████████████████▌                  | 840/1501 [00:58<00:39, 16.78it/s][A
Training:  56%|███████████████████████▌                  | 842/1501 [00:58<00:38, 17.28it/s][A
Training:  56%|███████████████████████▌                  | 844/1501 [00:58<00:37, 17.55it/s][A
Training:  56%|███████████████████████▋                  | 846/1501 [00:58<00:37, 17.69it/s][A
Training:  56%|███████████████████████▋                  | 848/1501 [00:58<00:37, 17.49it/s][A
Training:  57%|███████████████████████▊                  | 850/1501 [00:59<00:36, 17.69it/s][A
Training:  57%|███████████████████████▊                  | 852/1501 [00:59<00:36, 17.71it/s][A
Training:  57%|███████████████████████▉                  | 854/1501 [00:59<00:36, 17.51it/s][A
Training:  57%|███████████████████████▉ 

Training:  61%|█████████████████████████▋                | 920/1501 [01:07<00:41, 14.05it/s][A
Training:  61%|█████████████████████████▊                | 922/1501 [01:07<00:38, 15.03it/s][A
Training:  62%|█████████████████████████▊                | 924/1501 [01:07<00:37, 15.53it/s][A
Training:  62%|█████████████████████████▉                | 926/1501 [01:08<00:36, 15.97it/s][A
Training:  62%|█████████████████████████▉                | 928/1501 [01:08<00:34, 16.39it/s][A
Training:  62%|██████████████████████████                | 930/1501 [01:08<00:33, 16.85it/s][A
Training:  62%|██████████████████████████                | 932/1501 [01:08<00:33, 17.08it/s][A
Training:  62%|██████████████████████████▏               | 934/1501 [01:08<00:34, 16.67it/s][A
Training:  62%|██████████████████████████▏               | 936/1501 [01:08<00:34, 16.60it/s][A
Training:  62%|██████████████████████████▏               | 938/1501 [01:08<00:32, 17.08it/s][A
Training:  63%|█████████████████████████

Training:  73%|█████████████████████████████▊           | 1090/1501 [01:17<00:23, 17.23it/s][A
Training:  73%|█████████████████████████████▊           | 1092/1501 [01:17<00:23, 17.48it/s][A
Training:  73%|█████████████████████████████▉           | 1094/1501 [01:17<00:24, 16.86it/s][A
Training:  73%|█████████████████████████████▉           | 1096/1501 [01:18<00:23, 17.44it/s][A
Training:  73%|█████████████████████████████▉           | 1098/1501 [01:18<00:23, 17.40it/s][A
Training:  73%|██████████████████████████████           | 1100/1501 [01:18<00:23, 17.09it/s][A
Training:  73%|██████████████████████████████           | 1102/1501 [01:18<00:22, 17.53it/s][A
Training:  74%|██████████████████████████████▏          | 1104/1501 [01:18<00:22, 17.41it/s][A
Training:  74%|██████████████████████████████▏          | 1106/1501 [01:18<00:23, 16.90it/s][A
Training:  74%|██████████████████████████████▎          | 1108/1501 [01:18<00:22, 17.18it/s][A
Training:  74%|█████████████████████████

Evaluation...:  71%|██████████████████████████▊           | 118/167 [00:03<00:01, 34.68it/s][A[A

Evaluation...:  73%|███████████████████████████▊          | 122/167 [00:03<00:01, 34.44it/s][A[A

Evaluation...:  76%|████████████████████████████▉         | 127/167 [00:03<00:01, 36.07it/s][A[A

Evaluation...:  78%|█████████████████████████████▊        | 131/167 [00:04<00:01, 34.35it/s][A[A

Evaluation...:  81%|██████████████████████████████▋       | 135/167 [00:04<00:00, 32.61it/s][A[A

Evaluation...:  83%|███████████████████████████████▋      | 139/167 [00:04<00:00, 30.15it/s][A[A

Evaluation...:  86%|████████████████████████████████▌     | 143/167 [00:04<00:00, 29.78it/s][A[A

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 29.66it/s][A[A

Evaluation...:  90%|██████████████████████████████████▏   | 150/167 [00:04<00:00, 29.41it/s][A[A

Evaluation...:  92%|███████████████████████████████████   | 154/167 [00:04<00:00, 30.71it/s][A[A



Training:  89%|████████████████████████████████████▌    | 1340/1501 [01:38<00:09, 17.80it/s][A
Training:  89%|████████████████████████████████████▋    | 1342/1501 [01:38<00:09, 17.34it/s][A
Training:  90%|████████████████████████████████████▋    | 1344/1501 [01:38<00:09, 17.10it/s][A
Training:  90%|████████████████████████████████████▊    | 1346/1501 [01:38<00:09, 17.20it/s][A
Training:  90%|████████████████████████████████████▊    | 1348/1501 [01:38<00:08, 17.55it/s][A
Training:  90%|████████████████████████████████████▉    | 1350/1501 [01:39<00:08, 17.20it/s][A
Training:  90%|████████████████████████████████████▉    | 1352/1501 [01:39<00:08, 17.18it/s][A
Training:  90%|████████████████████████████████████▉    | 1354/1501 [01:39<00:08, 17.87it/s][A
Training:  90%|█████████████████████████████████████    | 1356/1501 [01:39<00:08, 16.93it/s][A
Training:  90%|█████████████████████████████████████    | 1358/1501 [01:39<00:08, 16.94it/s][A
Training:  91%|█████████████████████████

Evaluation...:  14%|█████▌                                 | 24/167 [00:00<00:04, 30.22it/s][A[A

Evaluation...:  17%|██████▌                                | 28/167 [00:00<00:04, 29.31it/s][A[A

Evaluation...:  19%|███████▏                               | 31/167 [00:01<00:04, 29.29it/s][A[A

Evaluation...:  20%|███████▉                               | 34/167 [00:01<00:04, 29.08it/s][A[A

Evaluation...:  22%|████████▋                              | 37/167 [00:01<00:04, 28.54it/s][A[A

Evaluation...:  25%|█████████▌                             | 41/167 [00:01<00:04, 30.23it/s][A[A

Evaluation...:  27%|██████████▌                            | 45/167 [00:01<00:03, 31.47it/s][A[A

Evaluation...:  29%|███████████▍                           | 49/167 [00:01<00:03, 31.80it/s][A[A

Evaluation...:  32%|████████████▍                          | 53/167 [00:01<00:03, 32.41it/s][A[A

Evaluation...:  34%|█████████████▎                         | 57/167 [00:01<00:03, 30.73it/s][A[A



>>> training loss:  1.1581, valid loss:  1.4665

                            valid f1 score:  0.5103, valid precision score:  0.5416,
                            valid recall score:  0.4968, valid accuracy score:  0.5260



Training:   0%|                                                    | 0/1501 [00:00<?, ?it/s][A
Training:   0%|                                            | 2/1501 [00:00<01:28, 17.03it/s][A
Training:   0%|                                            | 4/1501 [00:00<01:24, 17.71it/s][A
Training:   0%|▏                                           | 6/1501 [00:00<01:28, 16.93it/s][A
Training:   1%|▏                                           | 8/1501 [00:00<01:32, 16.19it/s][A
Training:   1%|▎                                          | 10/1501 [00:00<01:33, 16.01it/s][A
Training:   1%|▎                                          | 12/1501 [00:00<01:40, 14.82it/s][A
Training:   1%|▍                                          | 14/1501 [00:00<01:52, 13.25it/s][A
Training:   1%|▍                                          | 16/1501 [00:01<02:02, 12.09it/s][A
Training:   1%|▌                                          | 18/1501 [00:01<01:58, 12.54it/s][A
Training:   1%|▌                       

Training:  11%|████▊                                     | 170/1501 [00:11<01:22, 16.18it/s][A
Training:  11%|████▊                                     | 172/1501 [00:11<01:22, 16.02it/s][A
Training:  12%|████▊                                     | 174/1501 [00:12<01:26, 15.33it/s][A
Training:  12%|████▉                                     | 176/1501 [00:12<01:26, 15.37it/s][A
Training:  12%|████▉                                     | 178/1501 [00:12<01:29, 14.75it/s][A
Training:  12%|█████                                     | 180/1501 [00:12<01:31, 14.47it/s][A
Training:  12%|█████                                     | 182/1501 [00:12<01:31, 14.45it/s][A
Training:  12%|█████▏                                    | 184/1501 [00:12<01:30, 14.49it/s][A
Training:  12%|█████▏                                    | 186/1501 [00:12<01:30, 14.59it/s][A
Training:  13%|█████▎                                    | 188/1501 [00:13<01:29, 14.70it/s][A
Training:  13%|█████▎                   

Evaluation...:  50%|███████████████████▌                   | 84/167 [00:02<00:02, 38.41it/s][A[A

Evaluation...:  53%|████████████████████▌                  | 88/167 [00:02<00:02, 36.33it/s][A[A

Evaluation...:  55%|█████████████████████▍                 | 92/167 [00:02<00:02, 36.83it/s][A[A

Evaluation...:  57%|██████████████████████▍                | 96/167 [00:02<00:01, 36.81it/s][A[A

Evaluation...:  60%|██████████████████████▊               | 100/167 [00:02<00:01, 37.02it/s][A[A

Evaluation...:  62%|███████████████████████▋              | 104/167 [00:02<00:01, 37.66it/s][A[A

Evaluation...:  65%|████████████████████████▊             | 109/167 [00:02<00:01, 39.39it/s][A[A

Evaluation...:  68%|█████████████████████████▋            | 113/167 [00:03<00:01, 39.45it/s][A[A

Evaluation...:  70%|██████████████████████████▌           | 117/167 [00:03<00:01, 39.19it/s][A[A

Evaluation...:  72%|███████████████████████████▌          | 121/167 [00:03<00:01, 38.36it/s][A[A



Training:  28%|███████████▉                              | 427/1501 [00:32<01:04, 16.74it/s][A
Training:  29%|████████████                              | 429/1501 [00:32<01:01, 17.44it/s][A
Training:  29%|████████████                              | 431/1501 [00:32<01:02, 17.20it/s][A
Training:  29%|████████████                              | 433/1501 [00:32<00:59, 17.87it/s][A
Training:  29%|████████████▏                             | 436/1501 [00:33<00:59, 18.02it/s][A
Training:  29%|████████████▎                             | 438/1501 [00:33<00:59, 17.72it/s][A
Training:  29%|████████████▎                             | 440/1501 [00:33<01:00, 17.54it/s][A
Training:  29%|████████████▎                             | 442/1501 [00:33<00:59, 17.81it/s][A
Training:  30%|████████████▍                             | 444/1501 [00:33<00:58, 17.98it/s][A
Training:  30%|████████████▍                             | 446/1501 [00:33<01:00, 17.45it/s][A
Training:  30%|████████████▌            

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:04, 39.13it/s][A[A

Evaluation...:   5%|██▏                                     | 9/167 [00:00<00:03, 40.32it/s][A[A

Evaluation...:   8%|███▎                                   | 14/167 [00:00<00:03, 41.88it/s][A[A

Evaluation...:  11%|████▍                                  | 19/167 [00:00<00:03, 41.67it/s][A[A

Evaluation...:  14%|█████▌                                 | 24/167 [00:00<00:03, 40.71it/s][A[A

Evaluation...:  17%|██████▊                                | 29/167 [00:00<00:03, 38.17it/s][A[A

Evaluation...:  20%|███████▋                               | 33/167 [00:00<00:03, 38.02it/s][A[A

Evaluation...:  22%|████████▋                              | 37/167 [00:00<00:03, 36.42it/s][A[A

Evaluation...:  25%|█████████▌                             | 41/167 [00:01<00:03, 36.47it/s][A[A

Evaluation...:  27%|██████████▌                            | 45/167 [00:01<00:03, 37.27it/s][A[A



Training:  46%|███████████████████▏                      | 687/1501 [00:52<00:48, 16.79it/s][A
Training:  46%|███████████████████▎                      | 689/1501 [00:52<00:47, 17.24it/s][A
Training:  46%|███████████████████▎                      | 691/1501 [00:52<00:49, 16.33it/s][A
Training:  46%|███████████████████▍                      | 693/1501 [00:52<00:48, 16.53it/s][A
Training:  46%|███████████████████▍                      | 695/1501 [00:52<00:47, 16.95it/s][A
Training:  46%|███████████████████▌                      | 697/1501 [00:52<00:47, 17.02it/s][A
Training:  47%|███████████████████▌                      | 699/1501 [00:52<00:46, 17.11it/s][A
Training:  47%|███████████████████▌                      | 701/1501 [00:52<00:46, 17.14it/s][A
Training:  47%|███████████████████▋                      | 703/1501 [00:53<00:45, 17.37it/s][A
Training:  47%|███████████████████▋                      | 705/1501 [00:53<00:46, 17.17it/s][A
Training:  47%|███████████████████▊     

Training:  57%|████████████████████████                  | 860/1501 [01:01<00:34, 18.80it/s][A
Training:  57%|████████████████████████▏                 | 863/1501 [01:02<00:33, 19.28it/s][A
Training:  58%|████████████████████████▏                 | 865/1501 [01:02<00:33, 18.81it/s][A
Training:  58%|████████████████████████▎                 | 867/1501 [01:02<00:33, 18.67it/s][A
Training:  58%|████████████████████████▎                 | 869/1501 [01:02<00:34, 18.59it/s][A
Training:  58%|████████████████████████▎                 | 871/1501 [01:02<00:33, 18.84it/s][A
Training:  58%|████████████████████████▍                 | 873/1501 [01:02<00:37, 16.84it/s][A
Training:  58%|████████████████████████▍                 | 875/1501 [01:02<00:43, 14.38it/s][A
Training:  58%|████████████████████████▌                 | 877/1501 [01:03<00:41, 14.96it/s][A
Training:  59%|████████████████████████▌                 | 879/1501 [01:03<00:39, 15.91it/s][A
Training:  59%|████████████████████████▋

Training:  64%|██████████████████████████▊               | 956/1501 [01:11<00:30, 17.90it/s][A
Training:  64%|██████████████████████████▊               | 958/1501 [01:12<00:30, 17.99it/s][A
Training:  64%|██████████████████████████▊               | 960/1501 [01:12<00:29, 18.13it/s][A
Training:  64%|██████████████████████████▉               | 962/1501 [01:12<00:29, 18.47it/s][A
Training:  64%|██████████████████████████▉               | 964/1501 [01:12<00:30, 17.63it/s][A
Training:  64%|███████████████████████████               | 966/1501 [01:12<00:31, 17.11it/s][A
Training:  64%|███████████████████████████               | 968/1501 [01:12<00:30, 17.71it/s][A
Training:  65%|███████████████████████████▏              | 970/1501 [01:12<00:29, 17.98it/s][A
Training:  65%|███████████████████████████▏              | 972/1501 [01:12<00:28, 18.27it/s][A
Training:  65%|███████████████████████████▎              | 974/1501 [01:12<00:29, 17.89it/s][A
Training:  65%|█████████████████████████

Training:  75%|██████████████████████████████▊          | 1127/1501 [01:22<00:31, 11.98it/s][A
Training:  75%|██████████████████████████████▊          | 1129/1501 [01:22<00:31, 11.67it/s][A
Training:  75%|██████████████████████████████▉          | 1131/1501 [01:22<00:31, 11.63it/s][A
Training:  75%|██████████████████████████████▉          | 1133/1501 [01:23<00:29, 12.48it/s][A
Training:  76%|███████████████████████████████          | 1135/1501 [01:23<00:28, 12.78it/s][A
Training:  76%|███████████████████████████████          | 1137/1501 [01:23<00:28, 12.63it/s][A
Training:  76%|███████████████████████████████          | 1139/1501 [01:23<00:26, 13.41it/s][A
Training:  76%|███████████████████████████████▏         | 1141/1501 [01:23<00:26, 13.38it/s][A
Training:  76%|███████████████████████████████▏         | 1143/1501 [01:23<00:31, 11.21it/s][A
Training:  76%|███████████████████████████████▎         | 1145/1501 [01:24<00:30, 11.69it/s][A
Training:  76%|█████████████████████████

Training:  80%|████████████████████████████████▊        | 1199/1501 [01:34<03:34,  1.41it/s][A
Training:  80%|████████████████████████████████▊        | 1201/1501 [01:34<02:35,  1.93it/s][A
Training:  80%|████████████████████████████████▊        | 1203/1501 [01:34<01:58,  2.51it/s][A
Training:  80%|████████████████████████████████▉        | 1205/1501 [01:35<01:35,  3.10it/s][A
Training:  80%|████████████████████████████████▉        | 1206/1501 [01:35<01:23,  3.52it/s][A
Training:  80%|████████████████████████████████▉        | 1207/1501 [01:35<01:15,  3.91it/s][A
Training:  80%|████████████████████████████████▉        | 1208/1501 [01:35<01:05,  4.47it/s][A
Training:  81%|█████████████████████████████████        | 1209/1501 [01:35<00:57,  5.11it/s][A
Training:  81%|█████████████████████████████████        | 1210/1501 [01:35<00:51,  5.60it/s][A
Training:  81%|█████████████████████████████████        | 1212/1501 [01:35<00:38,  7.48it/s][A
Training:  81%|█████████████████████████

Training:  88%|████████████████████████████████████     | 1319/1501 [01:47<00:20,  8.92it/s][A
Training:  88%|████████████████████████████████████     | 1320/1501 [01:48<00:22,  7.91it/s][A
Training:  88%|████████████████████████████████████     | 1321/1501 [01:48<00:21,  8.32it/s][A
Training:  88%|████████████████████████████████████     | 1322/1501 [01:48<00:20,  8.65it/s][A
Training:  88%|████████████████████████████████████▏    | 1323/1501 [01:48<00:19,  8.92it/s][A
Training:  88%|████████████████████████████████████▏    | 1324/1501 [01:48<00:20,  8.68it/s][A
Training:  88%|████████████████████████████████████▏    | 1325/1501 [01:48<00:20,  8.64it/s][A
Training:  88%|████████████████████████████████████▏    | 1327/1501 [01:48<00:18,  9.46it/s][A
Training:  88%|████████████████████████████████████▎    | 1328/1501 [01:48<00:18,  9.54it/s][A
Training:  89%|████████████████████████████████████▎    | 1330/1501 [01:49<00:15, 10.80it/s][A
Training:  89%|█████████████████████████

Training:  98%|████████████████████████████████████████▎| 1478/1501 [02:00<00:01, 13.56it/s][A
Training:  99%|████████████████████████████████████████▍| 1480/1501 [02:00<00:01, 14.45it/s][A
Training:  99%|████████████████████████████████████████▍| 1482/1501 [02:00<00:01, 14.89it/s][A
Training:  99%|████████████████████████████████████████▌| 1484/1501 [02:00<00:01, 15.06it/s][A
Training:  99%|████████████████████████████████████████▌| 1486/1501 [02:00<00:00, 15.33it/s][A
Training:  99%|████████████████████████████████████████▋| 1488/1501 [02:00<00:00, 16.07it/s][A
Training:  99%|████████████████████████████████████████▋| 1490/1501 [02:01<00:00, 14.84it/s][A
Training:  99%|████████████████████████████████████████▊| 1492/1501 [02:01<00:00, 13.00it/s][A
Training: 100%|████████████████████████████████████████▊| 1494/1501 [02:01<00:00, 13.49it/s][A
Training: 100%|████████████████████████████████████████▊| 1496/1501 [02:01<00:00, 14.86it/s][A

Evaluation...:   0%|                   

Training:   4%|█▊                                         | 64/1501 [00:04<01:28, 16.26it/s][A
Training:   4%|█▉                                         | 66/1501 [00:05<01:27, 16.31it/s][A
Training:   5%|█▉                                         | 68/1501 [00:05<01:23, 17.11it/s][A
Training:   5%|██                                         | 70/1501 [00:05<01:20, 17.68it/s][A
Training:   5%|██                                         | 72/1501 [00:05<01:20, 17.76it/s][A
Training:   5%|██                                         | 74/1501 [00:05<01:19, 17.91it/s][A
Training:   5%|██▏                                        | 76/1501 [00:05<01:22, 17.17it/s][A
Training:   5%|██▏                                        | 78/1501 [00:05<01:23, 17.02it/s][A
Training:   5%|██▎                                        | 80/1501 [00:05<01:21, 17.45it/s][A
Training:   5%|██▎                                        | 82/1501 [00:05<01:18, 18.02it/s][A
Training:   6%|██▍                      

Training:  16%|██████▌                                   | 235/1501 [00:14<01:30, 13.96it/s][A
Training:  16%|██████▋                                   | 237/1501 [00:15<01:27, 14.38it/s][A
Training:  16%|██████▋                                   | 239/1501 [00:15<01:23, 15.09it/s][A
Training:  16%|██████▋                                   | 241/1501 [00:15<01:18, 15.99it/s][A
Training:  16%|██████▊                                   | 243/1501 [00:15<01:15, 16.65it/s][A
Training:  16%|██████▊                                   | 245/1501 [00:15<01:16, 16.47it/s][A
Training:  16%|██████▉                                   | 247/1501 [00:15<01:18, 16.02it/s][A
Training:  17%|██████▉                                   | 249/1501 [00:15<01:17, 16.09it/s][A
Training:  17%|███████                                   | 251/1501 [00:15<01:13, 17.06it/s][A
Training:  17%|███████                                   | 253/1501 [00:15<01:13, 17.09it/s][A
Training:  17%|███████▏                 

Training:  22%|█████████▏                                | 329/1501 [00:24<01:09, 16.94it/s][A
Training:  22%|█████████▎                                | 331/1501 [00:25<01:08, 17.09it/s][A
Training:  22%|█████████▎                                | 333/1501 [00:25<01:05, 17.81it/s][A
Training:  22%|█████████▎                                | 335/1501 [00:25<01:05, 17.92it/s][A
Training:  22%|█████████▍                                | 337/1501 [00:25<01:05, 17.65it/s][A
Training:  23%|█████████▍                                | 339/1501 [00:25<01:07, 17.12it/s][A
Training:  23%|█████████▌                                | 341/1501 [00:25<01:21, 14.24it/s][A
Training:  23%|█████████▌                                | 343/1501 [00:25<01:22, 14.11it/s][A
Training:  23%|█████████▋                                | 345/1501 [00:25<01:17, 14.97it/s][A
Training:  23%|█████████▋                                | 347/1501 [00:26<01:14, 15.51it/s][A
Training:  23%|█████████▊               

Training:  34%|██████████████▏                           | 506/1501 [00:35<00:53, 18.46it/s][A
Training:  34%|██████████████▏                           | 508/1501 [00:35<00:54, 18.30it/s][A
Training:  34%|██████████████▎                           | 510/1501 [00:35<00:55, 17.75it/s][A
Training:  34%|██████████████▎                           | 512/1501 [00:36<00:56, 17.55it/s][A
Training:  34%|██████████████▍                           | 514/1501 [00:36<00:57, 17.04it/s][A
Training:  34%|██████████████▍                           | 516/1501 [00:36<00:57, 17.20it/s][A
Training:  35%|██████████████▍                           | 518/1501 [00:36<00:55, 17.87it/s][A
Training:  35%|██████████████▌                           | 520/1501 [00:36<00:56, 17.47it/s][A
Training:  35%|██████████████▌                           | 522/1501 [00:36<00:55, 17.63it/s][A
Training:  35%|██████████████▋                           | 524/1501 [00:36<01:04, 15.09it/s][A
Training:  35%|██████████████▋          

Training:  40%|████████████████▋                         | 598/1501 [00:46<08:12,  1.83it/s][A
Training:  40%|████████████████▊                         | 600/1501 [00:46<06:00,  2.50it/s][A
Training:  40%|████████████████▊                         | 602/1501 [00:46<04:28,  3.35it/s][A
Training:  40%|████████████████▉                         | 604/1501 [00:46<03:23,  4.40it/s][A
Training:  40%|████████████████▉                         | 606/1501 [00:47<02:46,  5.37it/s][A
Training:  41%|█████████████████                         | 608/1501 [00:47<02:16,  6.55it/s][A
Training:  41%|█████████████████                         | 610/1501 [00:47<01:55,  7.74it/s][A
Training:  41%|█████████████████                         | 612/1501 [00:47<01:41,  8.75it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [00:47<01:30,  9.78it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [00:47<01:23, 10.55it/s][A
Training:  41%|█████████████████▎       

Training:  51%|█████████████████████▍                    | 768/1501 [00:58<01:00, 12.12it/s][A
Training:  51%|█████████████████████▌                    | 770/1501 [00:58<01:04, 11.41it/s][A
Training:  51%|█████████████████████▌                    | 772/1501 [00:59<01:03, 11.45it/s][A
Training:  52%|█████████████████████▋                    | 774/1501 [00:59<01:04, 11.28it/s][A
Training:  52%|█████████████████████▋                    | 776/1501 [00:59<01:00, 11.95it/s][A
Training:  52%|█████████████████████▊                    | 778/1501 [00:59<00:59, 12.06it/s][A
Training:  52%|█████████████████████▊                    | 780/1501 [00:59<00:56, 12.87it/s][A
Training:  52%|█████████████████████▉                    | 782/1501 [00:59<00:51, 14.09it/s][A
Training:  52%|█████████████████████▉                    | 784/1501 [00:59<00:47, 15.12it/s][A
Training:  52%|█████████████████████▉                    | 786/1501 [01:00<00:47, 15.00it/s][A
Training:  52%|██████████████████████   

Evaluation...:  47%|██████████████████▍                    | 79/167 [00:02<00:02, 38.16it/s][A[A

Evaluation...:  50%|███████████████████▍                   | 83/167 [00:02<00:02, 38.05it/s][A[A

Evaluation...:  52%|████████████████████▎                  | 87/167 [00:02<00:02, 36.25it/s][A[A

Evaluation...:  54%|█████████████████████▎                 | 91/167 [00:02<00:02, 36.38it/s][A[A

Evaluation...:  57%|██████████████████████▏                | 95/167 [00:02<00:02, 35.65it/s][A[A

Evaluation...:  59%|███████████████████████                | 99/167 [00:02<00:01, 35.51it/s][A[A

Evaluation...:  62%|███████████████████████▍              | 103/167 [00:03<00:01, 35.91it/s][A[A

Evaluation...:  64%|████████████████████████▎             | 107/167 [00:03<00:01, 36.27it/s][A[A

Evaluation...:  67%|█████████████████████████▍            | 112/167 [00:03<00:01, 37.78it/s][A[A

Evaluation...:  69%|██████████████████████████▍           | 116/167 [00:03<00:01, 38.02it/s][A[A



>>> training loss:  0.7307, valid loss:  1.6164

                            valid f1 score:  0.5177, valid precision score:  0.5384,
                            valid recall score:  0.5081, valid accuracy score:  0.5300



Training:  60%|█████████████████████████▏                | 900/1501 [01:11<04:12,  2.38it/s][A
Training:  60%|█████████████████████████▏                | 902/1501 [01:11<03:06,  3.21it/s][A
Training:  60%|█████████████████████████▎                | 904/1501 [01:12<02:20,  4.24it/s][A
Training:  60%|█████████████████████████▎                | 906/1501 [01:12<01:49,  5.46it/s][A
Training:  60%|█████████████████████████▍                | 908/1501 [01:12<01:26,  6.82it/s][A
Training:  61%|█████████████████████████▍                | 910/1501 [01:12<01:11,  8.25it/s][A
Training:  61%|█████████████████████████▌                | 912/1501 [01:12<01:00,  9.71it/s][A
Training:  61%|█████████████████████████▌                | 914/1501 [01:12<00:51, 11.37it/s][A
Training:  61%|█████████████████████████▋                | 916/1501 [01:12<00:45, 12.89it/s][A
Training:  61%|█████████████████████████▋                | 918/1501 [01:12<00:41, 14.02it/s][A
Training:  61%|████████████████████████

Training:  71%|█████████████████████████████            | 1066/1501 [01:23<00:29, 14.75it/s][A
Training:  71%|█████████████████████████████▏           | 1068/1501 [01:23<00:28, 14.94it/s][A
Training:  71%|█████████████████████████████▏           | 1070/1501 [01:23<00:27, 15.51it/s][A
Training:  71%|█████████████████████████████▎           | 1072/1501 [01:24<00:27, 15.80it/s][A
Training:  72%|█████████████████████████████▎           | 1074/1501 [01:24<00:28, 15.11it/s][A
Training:  72%|█████████████████████████████▍           | 1076/1501 [01:24<00:32, 13.04it/s][A
Training:  72%|█████████████████████████████▍           | 1078/1501 [01:24<00:33, 12.67it/s][A
Training:  72%|█████████████████████████████▌           | 1080/1501 [01:24<00:31, 13.41it/s][A
Training:  72%|█████████████████████████████▌           | 1082/1501 [01:24<00:29, 14.36it/s][A
Training:  72%|█████████████████████████████▌           | 1084/1501 [01:25<00:28, 14.79it/s][A
Training:  72%|█████████████████████████

Evaluation...:  47%|██████████████████▍                    | 79/167 [00:02<00:02, 37.52it/s][A[A

Evaluation...:  50%|███████████████████▌                   | 84/167 [00:02<00:02, 38.21it/s][A[A

Evaluation...:  53%|████████████████████▌                  | 88/167 [00:02<00:02, 35.17it/s][A[A

Evaluation...:  55%|█████████████████████▍                 | 92/167 [00:02<00:02, 35.85it/s][A[A

Evaluation...:  57%|██████████████████████▍                | 96/167 [00:02<00:01, 35.59it/s][A[A

Evaluation...:  60%|██████████████████████▊               | 100/167 [00:02<00:01, 34.93it/s][A[A

Evaluation...:  62%|███████████████████████▋              | 104/167 [00:02<00:01, 35.42it/s][A[A

Evaluation...:  65%|████████████████████████▌             | 108/167 [00:02<00:01, 36.49it/s][A[A

Evaluation...:  67%|█████████████████████████▍            | 112/167 [00:03<00:01, 36.12it/s][A[A

Evaluation...:  69%|██████████████████████████▍           | 116/167 [00:03<00:01, 36.78it/s][A[A



Training:  88%|████████████████████████████████████     | 1320/1501 [01:44<00:10, 16.75it/s][A
Training:  88%|████████████████████████████████████     | 1322/1501 [01:44<00:10, 16.64it/s][A
Training:  88%|████████████████████████████████████▏    | 1324/1501 [01:44<00:10, 16.67it/s][A
Training:  88%|████████████████████████████████████▏    | 1326/1501 [01:44<00:10, 16.84it/s][A
Training:  88%|████████████████████████████████████▎    | 1328/1501 [01:44<00:10, 16.73it/s][A
Training:  89%|████████████████████████████████████▎    | 1330/1501 [01:44<00:10, 17.01it/s][A
Training:  89%|████████████████████████████████████▍    | 1332/1501 [01:44<00:09, 17.23it/s][A
Training:  89%|████████████████████████████████████▍    | 1334/1501 [01:44<00:09, 17.45it/s][A
Training:  89%|████████████████████████████████████▍    | 1336/1501 [01:44<00:09, 17.34it/s][A
Training:  89%|████████████████████████████████████▌    | 1338/1501 [01:45<00:09, 17.16it/s][A
Training:  89%|█████████████████████████

Training:  99%|████████████████████████████████████████▋| 1490/1501 [01:54<00:00, 18.26it/s][A
Training:  99%|████████████████████████████████████████▊| 1492/1501 [01:54<00:00, 18.24it/s][A
Training: 100%|████████████████████████████████████████▊| 1494/1501 [01:54<00:00, 17.69it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:04, 36.45it/s][A[A

Evaluation...:   5%|█▉                                      | 8/167 [00:00<00:04, 37.25it/s][A[A

Evaluation...:   7%|██▊                                    | 12/167 [00:00<00:04, 37.74it/s][A[A

Evaluation...:  10%|███▉                                   | 17/167 [00:00<00:03, 38.97it/s][A[A

Evaluation...:  13%|████▉                                  | 21/167 [00:00<00:03, 38.73it/s][A[A

Evaluation...:  15%|█████▊                                 | 25/167 [00:00<00:03, 39.04it/s][A[A

Evaluation.

Training:   5%|██▏                                        | 76/1501 [00:04<01:23, 16.97it/s][A
Training:   5%|██▏                                        | 78/1501 [00:04<01:21, 17.52it/s][A
Training:   5%|██▎                                        | 80/1501 [00:04<01:19, 17.97it/s][A
Training:   5%|██▎                                        | 82/1501 [00:04<01:18, 18.10it/s][A
Training:   6%|██▍                                        | 84/1501 [00:04<01:20, 17.68it/s][A
Training:   6%|██▍                                        | 86/1501 [00:04<01:18, 17.97it/s][A
Training:   6%|██▌                                        | 88/1501 [00:05<01:19, 17.78it/s][A
Training:   6%|██▌                                        | 90/1501 [00:05<01:19, 17.68it/s][A
Training:   6%|██▋                                        | 92/1501 [00:05<01:19, 17.78it/s][A
Training:   6%|██▋                                        | 94/1501 [00:05<01:22, 17.10it/s][A
Training:   6%|██▊                      

Training:  16%|██████▉                                   | 246/1501 [00:14<01:13, 17.16it/s][A
Training:  17%|██████▉                                   | 248/1501 [00:14<01:12, 17.21it/s][A
Training:  17%|██████▉                                   | 250/1501 [00:14<01:11, 17.46it/s][A
Training:  17%|███████                                   | 252/1501 [00:14<01:12, 17.20it/s][A
Training:  17%|███████                                   | 254/1501 [00:14<01:10, 17.61it/s][A
Training:  17%|███████▏                                  | 256/1501 [00:14<01:08, 18.06it/s][A
Training:  17%|███████▏                                  | 258/1501 [00:14<01:08, 18.22it/s][A
Training:  17%|███████▎                                  | 260/1501 [00:15<01:08, 18.13it/s][A
Training:  17%|███████▎                                  | 262/1501 [00:15<01:10, 17.51it/s][A
Training:  18%|███████▍                                  | 264/1501 [00:15<01:09, 17.77it/s][A
Training:  18%|███████▍                 

Training:  23%|█████████▍                                | 338/1501 [00:23<01:09, 16.80it/s][A
Training:  23%|█████████▌                                | 340/1501 [00:23<01:11, 16.29it/s][A
Training:  23%|█████████▌                                | 342/1501 [00:24<01:09, 16.77it/s][A
Training:  23%|█████████▋                                | 344/1501 [00:24<01:08, 16.95it/s][A
Training:  23%|█████████▋                                | 346/1501 [00:24<01:08, 16.90it/s][A
Training:  23%|█████████▋                                | 348/1501 [00:24<01:07, 17.07it/s][A
Training:  23%|█████████▊                                | 350/1501 [00:24<01:05, 17.44it/s][A
Training:  23%|█████████▊                                | 352/1501 [00:24<01:05, 17.42it/s][A
Training:  24%|█████████▉                                | 354/1501 [00:24<01:09, 16.44it/s][A
Training:  24%|█████████▉                                | 356/1501 [00:24<01:11, 16.01it/s][A
Training:  24%|██████████               

Training:  34%|██████████████▏                           | 509/1501 [00:33<00:55, 18.02it/s][A
Training:  34%|██████████████▎                           | 512/1501 [00:34<00:53, 18.39it/s][A
Training:  34%|██████████████▍                           | 514/1501 [00:34<00:56, 17.58it/s][A
Training:  34%|██████████████▍                           | 516/1501 [00:34<00:56, 17.55it/s][A
Training:  35%|██████████████▍                           | 518/1501 [00:34<00:56, 17.49it/s][A
Training:  35%|██████████████▌                           | 520/1501 [00:34<00:55, 17.75it/s][A
Training:  35%|██████████████▌                           | 522/1501 [00:34<00:57, 17.17it/s][A
Training:  35%|██████████████▋                           | 524/1501 [00:34<00:57, 17.13it/s][A
Training:  35%|██████████████▋                           | 526/1501 [00:34<00:56, 17.24it/s][A
Training:  35%|██████████████▊                           | 528/1501 [00:34<00:57, 17.02it/s][A
Training:  35%|██████████████▊          

Training:  40%|████████████████▋                         | 598/1501 [00:43<08:12,  1.83it/s][A
Training:  40%|████████████████▊                         | 600/1501 [00:43<06:00,  2.50it/s][A
Training:  40%|████████████████▊                         | 602/1501 [00:44<04:28,  3.35it/s][A
Training:  40%|████████████████▉                         | 604/1501 [00:44<03:25,  4.36it/s][A
Training:  40%|████████████████▉                         | 606/1501 [00:44<02:41,  5.55it/s][A
Training:  41%|█████████████████                         | 608/1501 [00:44<02:17,  6.50it/s][A
Training:  41%|█████████████████                         | 610/1501 [00:44<01:59,  7.45it/s][A
Training:  41%|█████████████████                         | 612/1501 [00:44<01:41,  8.72it/s][A
Training:  41%|█████████████████▏                        | 614/1501 [00:45<01:36,  9.16it/s][A
Training:  41%|█████████████████▏                        | 616/1501 [00:45<01:31,  9.62it/s][A
Training:  41%|█████████████████▎       

Training:  51%|█████████████████████▍                    | 768/1501 [00:54<00:48, 15.03it/s][A
Training:  51%|█████████████████████▌                    | 770/1501 [00:54<00:51, 14.15it/s][A
Training:  51%|█████████████████████▌                    | 772/1501 [00:54<00:51, 14.08it/s][A
Training:  52%|█████████████████████▋                    | 774/1501 [00:54<00:48, 14.97it/s][A
Training:  52%|█████████████████████▋                    | 776/1501 [00:54<00:46, 15.67it/s][A
Training:  52%|█████████████████████▊                    | 778/1501 [00:55<00:44, 16.34it/s][A
Training:  52%|█████████████████████▊                    | 780/1501 [00:55<00:43, 16.48it/s][A
Training:  52%|█████████████████████▉                    | 782/1501 [00:55<00:47, 15.21it/s][A
Training:  52%|█████████████████████▉                    | 784/1501 [00:55<00:50, 14.16it/s][A
Training:  52%|█████████████████████▉                    | 786/1501 [00:55<00:52, 13.54it/s][A
Training:  52%|██████████████████████   

Evaluation...:  54%|█████████████████████▎                 | 91/167 [00:02<00:01, 38.78it/s][A[A

Evaluation...:  57%|██████████████████████▏                | 95/167 [00:02<00:01, 38.23it/s][A[A

Evaluation...:  59%|███████████████████████                | 99/167 [00:02<00:01, 38.27it/s][A[A

Evaluation...:  62%|███████████████████████▍              | 103/167 [00:02<00:01, 38.52it/s][A[A

Evaluation...:  65%|████████████████████████▌             | 108/167 [00:02<00:01, 40.26it/s][A[A

Evaluation...:  68%|█████████████████████████▋            | 113/167 [00:02<00:01, 41.03it/s][A[A

Evaluation...:  71%|██████████████████████████▊           | 118/167 [00:03<00:01, 40.54it/s][A[A

Evaluation...:  74%|███████████████████████████▉          | 123/167 [00:03<00:01, 40.51it/s][A[A

Evaluation...:  77%|█████████████████████████████▏        | 128/167 [00:03<00:00, 41.94it/s][A[A

Evaluation...:  80%|██████████████████████████████▎       | 133/167 [00:03<00:00, 39.55it/s][A[A



Training:  68%|████████████████████████████             | 1028/1501 [01:14<00:27, 17.12it/s][A
Training:  69%|████████████████████████████▏            | 1030/1501 [01:15<00:26, 17.64it/s][A
Training:  69%|████████████████████████████▏            | 1032/1501 [01:15<00:26, 17.90it/s][A
Training:  69%|████████████████████████████▏            | 1034/1501 [01:15<00:26, 17.51it/s][A
Training:  69%|████████████████████████████▎            | 1036/1501 [01:15<00:25, 17.98it/s][A
Training:  69%|████████████████████████████▎            | 1038/1501 [01:15<00:25, 18.23it/s][A
Training:  69%|████████████████████████████▍            | 1040/1501 [01:15<00:25, 17.87it/s][A
Training:  69%|████████████████████████████▍            | 1042/1501 [01:15<00:26, 17.04it/s][A
Training:  70%|████████████████████████████▌            | 1044/1501 [01:15<00:27, 16.43it/s][A
Training:  70%|████████████████████████████▌            | 1046/1501 [01:16<00:27, 16.37it/s][A
Training:  70%|█████████████████████████

Evaluation...:   7%|██▊                                    | 12/167 [00:00<00:04, 33.04it/s][A[A

Evaluation...:  10%|███▋                                   | 16/167 [00:00<00:04, 32.87it/s][A[A

Evaluation...:  12%|████▋                                  | 20/167 [00:00<00:04, 33.70it/s][A[A

Evaluation...:  14%|█████▌                                 | 24/167 [00:00<00:04, 35.22it/s][A[A

Evaluation...:  17%|██████▌                                | 28/167 [00:00<00:03, 35.66it/s][A[A

Evaluation...:  19%|███████▍                               | 32/167 [00:00<00:03, 34.75it/s][A[A

Evaluation...:  22%|████████▍                              | 36/167 [00:01<00:03, 34.08it/s][A[A

Evaluation...:  24%|█████████▎                             | 40/167 [00:01<00:03, 34.03it/s][A[A

Evaluation...:  26%|██████████▎                            | 44/167 [00:01<00:03, 33.80it/s][A[A

Evaluation...:  29%|███████████▏                           | 48/167 [00:01<00:03, 34.13it/s][A[A



Training:  86%|███████████████████████████████████      | 1285/1501 [01:34<00:13, 15.63it/s][A
Training:  86%|███████████████████████████████████▏     | 1287/1501 [01:35<00:13, 16.09it/s][A
Training:  86%|███████████████████████████████████▏     | 1289/1501 [01:35<00:12, 16.75it/s][A
Training:  86%|███████████████████████████████████▎     | 1291/1501 [01:35<00:12, 17.30it/s][A
Training:  86%|███████████████████████████████████▎     | 1293/1501 [01:35<00:14, 14.04it/s][A
Training:  86%|███████████████████████████████████▎     | 1295/1501 [01:35<00:14, 14.26it/s][A
Training:  86%|███████████████████████████████████▍     | 1297/1501 [01:35<00:13, 15.09it/s][A
Training:  87%|███████████████████████████████████▍     | 1299/1501 [01:35<00:12, 15.55it/s][A
Training:  87%|███████████████████████████████████▌     | 1301/1501 [01:35<00:12, 16.35it/s][A
Training:  87%|███████████████████████████████████▌     | 1303/1501 [01:36<00:12, 16.47it/s][A
Training:  87%|█████████████████████████

Training:  97%|███████████████████████████████████████▋ | 1455/1501 [01:46<00:02, 15.54it/s][A
Training:  97%|███████████████████████████████████████▊ | 1457/1501 [01:46<00:02, 15.60it/s][A
Training:  97%|███████████████████████████████████████▊ | 1459/1501 [01:46<00:02, 15.87it/s][A
Training:  97%|███████████████████████████████████████▉ | 1461/1501 [01:46<00:02, 15.38it/s][A
Training:  97%|███████████████████████████████████████▉ | 1463/1501 [01:46<00:02, 15.45it/s][A
Training:  98%|████████████████████████████████████████ | 1465/1501 [01:46<00:02, 15.08it/s][A
Training:  98%|████████████████████████████████████████ | 1467/1501 [01:46<00:02, 15.27it/s][A
Training:  98%|████████████████████████████████████████▏| 1469/1501 [01:47<00:02, 15.30it/s][A
Training:  98%|████████████████████████████████████████▏| 1471/1501 [01:47<00:01, 15.60it/s][A
Training:  98%|████████████████████████████████████████▏| 1473/1501 [01:47<00:01, 15.64it/s][A
Training:  98%|█████████████████████████

Training:   2%|█                                          | 36/1501 [00:02<01:24, 17.33it/s][A
Training:   3%|█                                          | 38/1501 [00:02<01:25, 17.03it/s][A
Training:   3%|█▏                                         | 40/1501 [00:02<01:24, 17.30it/s][A
Training:   3%|█▏                                         | 42/1501 [00:02<01:24, 17.30it/s][A
Training:   3%|█▎                                         | 44/1501 [00:02<01:25, 16.95it/s][A
Training:   3%|█▎                                         | 46/1501 [00:02<01:28, 16.53it/s][A
Training:   3%|█▍                                         | 48/1501 [00:02<01:26, 16.73it/s][A
Training:   3%|█▍                                         | 50/1501 [00:03<01:24, 17.22it/s][A
Training:   3%|█▍                                         | 52/1501 [00:03<01:30, 16.10it/s][A
Training:   4%|█▌                                         | 54/1501 [00:03<01:26, 16.81it/s][A
Training:   4%|█▌                       

Training:  14%|█████▊                                    | 206/1501 [00:12<01:16, 16.92it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:12<01:14, 17.37it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:12<01:13, 17.49it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:13<01:14, 17.30it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:13<01:15, 17.09it/s][A
Training:  14%|██████                                    | 216/1501 [00:13<01:13, 17.48it/s][A
Training:  15%|██████                                    | 218/1501 [00:13<01:12, 17.63it/s][A
Training:  15%|██████▏                                   | 220/1501 [00:13<01:14, 17.27it/s][A
Training:  15%|██████▏                                   | 222/1501 [00:13<01:13, 17.37it/s][A
Training:  15%|██████▎                                   | 224/1501 [00:13<01:13, 17.27it/s][A
Training:  15%|██████▎                  

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 35.01it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 36.18it/s][A[A

Training:  20%|████████▏                                 | 294/1501 [00:22<15:10,  1.33it/s][A
Training:  20%|████████▎                                 | 296/1501 [00:22<10:58,  1.83it/s][A
Training:  20%|████████▎                                 | 298/1501 [00:22<08:01,  2.50it/s][A
Training:  20%|████████▍                                 | 300/1501 [00:22<05:57,  3.36it/s][A
Training:  20%|████████▍                                 | 302/1501 [00:22<04:29,  4.45it/s][A
Training:  20%|████████▌                                 | 304/1501 [00:23<03:27,  5.77it/s][A
Training:  20%|████████▌                                 | 306/1501 [00:23<02:46,  7.19it/s][A
Training:  21%|████████▌                                 | 308/1501 [00:23<02:15,  8.78it/s][A
Training:  21%|████████▋        

Training:  31%|████████████▊                             | 460/1501 [00:32<01:08, 15.23it/s][A
Training:  31%|████████████▉                             | 462/1501 [00:32<01:11, 14.49it/s][A
Training:  31%|████████████▉                             | 464/1501 [00:32<01:11, 14.51it/s][A
Training:  31%|█████████████                             | 466/1501 [00:32<01:25, 12.08it/s][A
Training:  31%|█████████████                             | 468/1501 [00:32<01:20, 12.83it/s][A
Training:  31%|█████████████▏                            | 470/1501 [00:33<01:14, 13.86it/s][A
Training:  31%|█████████████▏                            | 472/1501 [00:33<01:10, 14.50it/s][A
Training:  32%|█████████████▎                            | 474/1501 [00:33<01:08, 14.89it/s][A
Training:  32%|█████████████▎                            | 476/1501 [00:33<01:07, 15.29it/s][A
Training:  32%|█████████████▍                            | 478/1501 [00:33<01:06, 15.50it/s][A
Training:  32%|█████████████▍           

Evaluation...:  41%|████████████████                       | 69/167 [00:01<00:02, 35.74it/s][A[A

Evaluation...:  44%|█████████████████                      | 73/167 [00:02<00:02, 33.34it/s][A[A

Evaluation...:  46%|█████████████████▉                     | 77/167 [00:02<00:03, 25.27it/s][A[A

Evaluation...:  48%|██████████████████▋                    | 80/167 [00:02<00:03, 25.30it/s][A[A

Evaluation...:  50%|███████████████████▍                   | 83/167 [00:02<00:03, 26.01it/s][A[A

Evaluation...:  51%|████████████████████                   | 86/167 [00:02<00:03, 26.32it/s][A[A

Evaluation...:  53%|████████████████████▊                  | 89/167 [00:02<00:02, 26.59it/s][A[A

Evaluation...:  56%|█████████████████████▋                 | 93/167 [00:02<00:02, 28.24it/s][A[A

Evaluation...:  58%|██████████████████████▋                | 97/167 [00:02<00:02, 28.84it/s][A[A

Evaluation...:  60%|██████████████████████▉               | 101/167 [00:03<00:02, 29.47it/s][A[A



Training:  47%|███████████████████▊                      | 710/1501 [00:53<00:49, 16.00it/s][A
Training:  47%|███████████████████▉                      | 712/1501 [00:53<00:47, 16.56it/s][A
Training:  48%|███████████████████▉                      | 714/1501 [00:54<00:46, 16.76it/s][A
Training:  48%|████████████████████                      | 716/1501 [00:54<00:45, 17.12it/s][A
Training:  48%|████████████████████                      | 718/1501 [00:54<00:45, 17.15it/s][A
Training:  48%|████████████████████▏                     | 720/1501 [00:54<00:46, 16.72it/s][A
Training:  48%|████████████████████▏                     | 722/1501 [00:54<00:50, 15.52it/s][A
Training:  48%|████████████████████▎                     | 724/1501 [00:54<00:54, 14.24it/s][A
Training:  48%|████████████████████▎                     | 726/1501 [00:54<01:05, 11.75it/s][A
Training:  49%|████████████████████▎                     | 728/1501 [00:55<01:02, 12.37it/s][A
Training:  49%|████████████████████▍    

Training:  59%|████████████████████████▌                 | 880/1501 [01:04<00:38, 16.24it/s][A
Training:  59%|████████████████████████▋                 | 882/1501 [01:04<00:36, 16.92it/s][A
Training:  59%|████████████████████████▋                 | 884/1501 [01:04<00:35, 17.45it/s][A
Training:  59%|████████████████████████▊                 | 886/1501 [01:04<00:36, 16.92it/s][A
Training:  59%|████████████████████████▊                 | 888/1501 [01:04<00:35, 17.15it/s][A
Training:  59%|████████████████████████▉                 | 890/1501 [01:05<00:35, 17.09it/s][A
Training:  59%|████████████████████████▉                 | 892/1501 [01:05<00:35, 17.39it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:05, 29.98it/s][A[A

Evaluation...:   4%|█▋                                      | 7/167 [00:00<00:05, 29.61it/s][A[A

Evaluation...:   7%|██▌    

Training:  64%|██████████████████████████▉               | 964/1501 [01:15<00:36, 14.81it/s][A
Training:  64%|███████████████████████████               | 966/1501 [01:15<00:36, 14.67it/s][A
Training:  64%|███████████████████████████               | 968/1501 [01:15<00:39, 13.41it/s][A
Training:  65%|███████████████████████████▏              | 970/1501 [01:15<00:39, 13.33it/s][A
Training:  65%|███████████████████████████▏              | 972/1501 [01:15<00:37, 14.01it/s][A
Training:  65%|███████████████████████████▎              | 974/1501 [01:15<00:37, 14.15it/s][A
Training:  65%|███████████████████████████▎              | 976/1501 [01:16<00:42, 12.44it/s][A
Training:  65%|███████████████████████████▎              | 978/1501 [01:16<00:39, 13.21it/s][A
Training:  65%|███████████████████████████▍              | 980/1501 [01:16<00:39, 13.05it/s][A
Training:  65%|███████████████████████████▍              | 982/1501 [01:16<00:38, 13.55it/s][A
Training:  66%|█████████████████████████

Training:  76%|██████████████████████████████▉          | 1134/1501 [01:27<00:28, 12.83it/s][A
Training:  76%|███████████████████████████████          | 1136/1501 [01:27<00:25, 14.05it/s][A
Training:  76%|███████████████████████████████          | 1138/1501 [01:27<00:24, 14.77it/s][A
Training:  76%|███████████████████████████████▏         | 1140/1501 [01:27<00:22, 15.70it/s][A
Training:  76%|███████████████████████████████▏         | 1142/1501 [01:27<00:22, 16.00it/s][A
Training:  76%|███████████████████████████████▏         | 1144/1501 [01:27<00:21, 16.66it/s][A
Training:  76%|███████████████████████████████▎         | 1146/1501 [01:27<00:21, 16.42it/s][A
Training:  76%|███████████████████████████████▎         | 1148/1501 [01:27<00:21, 16.70it/s][A
Training:  77%|███████████████████████████████▍         | 1150/1501 [01:27<00:21, 16.47it/s][A
Training:  77%|███████████████████████████████▍         | 1152/1501 [01:28<00:22, 15.67it/s][A
Training:  77%|█████████████████████████

Training:  81%|█████████████████████████████████▏       | 1216/1501 [01:37<00:22, 12.78it/s][A
Training:  81%|█████████████████████████████████▎       | 1218/1501 [01:37<00:21, 13.06it/s][A
Training:  81%|█████████████████████████████████▎       | 1220/1501 [01:37<00:21, 13.00it/s][A
Training:  81%|█████████████████████████████████▍       | 1222/1501 [01:38<00:22, 12.31it/s][A
Training:  82%|█████████████████████████████████▍       | 1224/1501 [01:38<00:22, 12.22it/s][A
Training:  82%|█████████████████████████████████▍       | 1226/1501 [01:38<00:21, 12.53it/s][A
Training:  82%|█████████████████████████████████▌       | 1228/1501 [01:38<00:19, 13.67it/s][A
Training:  82%|█████████████████████████████████▌       | 1230/1501 [01:38<00:18, 14.49it/s][A
Training:  82%|█████████████████████████████████▋       | 1232/1501 [01:38<00:17, 15.28it/s][A
Training:  82%|█████████████████████████████████▋       | 1234/1501 [01:38<00:17, 15.31it/s][A
Training:  82%|█████████████████████████

Training:  93%|█████████████████████████████████████▉   | 1389/1501 [01:48<00:07, 15.50it/s][A
Training:  93%|█████████████████████████████████████▉   | 1391/1501 [01:48<00:06, 16.25it/s][A
Training:  93%|██████████████████████████████████████   | 1393/1501 [01:49<00:07, 15.00it/s][A
Training:  93%|██████████████████████████████████████   | 1395/1501 [01:49<00:07, 14.17it/s][A
Training:  93%|██████████████████████████████████████▏  | 1397/1501 [01:49<00:07, 14.34it/s][A
Training:  93%|██████████████████████████████████████▏  | 1399/1501 [01:49<00:08, 12.72it/s][A
Training:  93%|██████████████████████████████████████▎  | 1401/1501 [01:49<00:07, 13.24it/s][A
Training:  93%|██████████████████████████████████████▎  | 1403/1501 [01:49<00:06, 14.15it/s][A
Training:  94%|██████████████████████████████████████▍  | 1405/1501 [01:50<00:07, 12.82it/s][A
Training:  94%|██████████████████████████████████████▍  | 1407/1501 [01:50<00:07, 13.06it/s][A
Training:  94%|█████████████████████████

Evaluation...:  75%|████████████████████████████▍         | 125/167 [00:03<00:01, 29.10it/s][A[A

Evaluation...:  77%|█████████████████████████████▎        | 129/167 [00:04<00:01, 30.21it/s][A[A

Evaluation...:  80%|██████████████████████████████▎       | 133/167 [00:04<00:01, 30.58it/s][A[A

Evaluation...:  82%|███████████████████████████████▏      | 137/167 [00:04<00:00, 32.16it/s][A[A

Evaluation...:  84%|████████████████████████████████      | 141/167 [00:04<00:00, 27.55it/s][A[A

Evaluation...:  87%|████████████████████████████████▉     | 145/167 [00:04<00:00, 29.59it/s][A[A

Evaluation...:  89%|█████████████████████████████████▉    | 149/167 [00:04<00:00, 29.63it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:04<00:00, 30.93it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 30.24it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:05<00:00, 32.04it/s][A[A



Training:   9%|███▊                                      | 136/1501 [00:09<01:24, 16.18it/s][A
Training:   9%|███▊                                      | 138/1501 [00:09<01:28, 15.41it/s][A
Training:   9%|███▉                                      | 140/1501 [00:09<01:26, 15.78it/s][A
Training:   9%|███▉                                      | 142/1501 [00:09<01:24, 16.07it/s][A
Training:  10%|████                                      | 144/1501 [00:10<01:36, 14.13it/s][A
Training:  10%|████                                      | 146/1501 [00:10<01:36, 14.00it/s][A
Training:  10%|████▏                                     | 148/1501 [00:10<01:35, 14.24it/s][A
Training:  10%|████▏                                     | 150/1501 [00:10<01:37, 13.93it/s][A
Training:  10%|████▎                                     | 152/1501 [00:10<01:38, 13.76it/s][A
Training:  10%|████▎                                     | 154/1501 [00:10<01:33, 14.34it/s][A
Training:  10%|████▎                    

Evaluation...:  14%|█████▌                                 | 24/167 [00:00<00:04, 35.42it/s][A[A

Evaluation...:  17%|██████▌                                | 28/167 [00:00<00:04, 34.05it/s][A[A

Evaluation...:  19%|███████▍                               | 32/167 [00:00<00:03, 34.54it/s][A[A

Evaluation...:  22%|████████▍                              | 36/167 [00:01<00:03, 35.41it/s][A[A

Evaluation...:  24%|█████████▎                             | 40/167 [00:01<00:03, 35.56it/s][A[A

Evaluation...:  26%|██████████▎                            | 44/167 [00:01<00:03, 33.71it/s][A[A

Evaluation...:  29%|███████████▏                           | 48/167 [00:01<00:03, 33.23it/s][A[A

Evaluation...:  31%|████████████▏                          | 52/167 [00:01<00:03, 34.31it/s][A[A

Evaluation...:  34%|█████████████                          | 56/167 [00:01<00:03, 33.18it/s][A[A

Evaluation...:  37%|██████████████▏                        | 61/167 [00:01<00:02, 35.60it/s][A[A



Training:  26%|██████████▉                               | 391/1501 [00:30<01:22, 13.47it/s][A
Training:  26%|██████████▉                               | 393/1501 [00:31<01:21, 13.57it/s][A
Training:  26%|███████████                               | 395/1501 [00:31<01:19, 13.91it/s][A
Training:  26%|███████████                               | 397/1501 [00:31<01:15, 14.69it/s][A
Training:  27%|███████████▏                              | 399/1501 [00:31<01:12, 15.20it/s][A
Training:  27%|███████████▏                              | 401/1501 [00:31<01:09, 15.81it/s][A
Training:  27%|███████████▎                              | 403/1501 [00:31<01:08, 15.92it/s][A
Training:  27%|███████████▎                              | 405/1501 [00:31<01:10, 15.64it/s][A
Training:  27%|███████████▍                              | 407/1501 [00:31<01:06, 16.45it/s][A
Training:  27%|███████████▍                              | 409/1501 [00:32<01:15, 14.54it/s][A
Training:  27%|███████████▌             

Training:  37%|███████████████▋                          | 561/1501 [00:42<00:51, 18.38it/s][A
Training:  38%|███████████████▊                          | 563/1501 [00:42<00:53, 17.63it/s][A
Training:  38%|███████████████▊                          | 565/1501 [00:42<00:51, 18.00it/s][A
Training:  38%|███████████████▊                          | 567/1501 [00:42<00:53, 17.50it/s][A
Training:  38%|███████████████▉                          | 569/1501 [00:42<00:56, 16.44it/s][A
Training:  38%|███████████████▉                          | 571/1501 [00:43<00:57, 16.14it/s][A
Training:  38%|████████████████                          | 573/1501 [00:43<00:56, 16.40it/s][A
Training:  38%|████████████████                          | 575/1501 [00:43<00:54, 17.00it/s][A
Training:  38%|████████████████▏                         | 577/1501 [00:43<00:53, 17.19it/s][A
Training:  39%|████████████████▏                         | 579/1501 [00:43<00:54, 16.91it/s][A
Training:  39%|████████████████▎        

Training:  43%|██████████████████                        | 645/1501 [00:51<00:46, 18.54it/s][A
Training:  43%|██████████████████                        | 647/1501 [00:52<00:47, 17.90it/s][A
Training:  43%|██████████████████▏                       | 649/1501 [00:52<00:49, 17.17it/s][A
Training:  43%|██████████████████▏                       | 651/1501 [00:52<00:49, 17.21it/s][A
Training:  44%|██████████████████▎                       | 654/1501 [00:52<00:47, 17.93it/s][A
Training:  44%|██████████████████▎                       | 656/1501 [00:52<00:47, 17.70it/s][A
Training:  44%|██████████████████▍                       | 658/1501 [00:52<00:46, 17.99it/s][A
Training:  44%|██████████████████▍                       | 660/1501 [00:52<00:49, 17.15it/s][A
Training:  44%|██████████████████▌                       | 662/1501 [00:52<00:56, 14.91it/s][A
Training:  44%|██████████████████▌                       | 664/1501 [00:53<01:03, 13.25it/s][A
Training:  44%|██████████████████▋      

Training:  54%|██████████████████████▊                   | 815/1501 [01:03<00:40, 16.75it/s][A
Training:  54%|██████████████████████▊                   | 817/1501 [01:03<00:40, 16.94it/s][A
Training:  55%|██████████████████████▉                   | 819/1501 [01:03<00:39, 17.12it/s][A
Training:  55%|██████████████████████▉                   | 821/1501 [01:03<00:39, 17.12it/s][A
Training:  55%|███████████████████████                   | 823/1501 [01:03<00:38, 17.63it/s][A
Training:  55%|███████████████████████                   | 825/1501 [01:04<00:39, 17.11it/s][A
Training:  55%|███████████████████████▏                  | 827/1501 [01:04<00:39, 17.06it/s][A
Training:  55%|███████████████████████▏                  | 829/1501 [01:04<00:37, 17.77it/s][A
Training:  55%|███████████████████████▎                  | 831/1501 [01:04<00:38, 17.22it/s][A
Training:  55%|███████████████████████▎                  | 833/1501 [01:04<00:39, 17.11it/s][A
Training:  56%|███████████████████████▎ 

Training:  60%|█████████████████████████                 | 895/1501 [01:13<06:13,  1.62it/s][A
Training:  60%|█████████████████████████                 | 897/1501 [01:13<04:33,  2.21it/s][A
Training:  60%|█████████████████████████▏                | 899/1501 [01:13<03:21,  2.99it/s][A
Training:  60%|█████████████████████████▏                | 901/1501 [01:14<02:31,  3.96it/s][A
Training:  60%|█████████████████████████▎                | 903/1501 [01:14<01:56,  5.13it/s][A
Training:  60%|█████████████████████████▎                | 905/1501 [01:14<01:33,  6.40it/s][A
Training:  60%|█████████████████████████▍                | 907/1501 [01:14<01:16,  7.79it/s][A
Training:  61%|█████████████████████████▍                | 909/1501 [01:14<01:05,  9.06it/s][A
Training:  61%|█████████████████████████▍                | 911/1501 [01:14<00:54, 10.74it/s][A
Training:  61%|█████████████████████████▌                | 913/1501 [01:14<00:47, 12.42it/s][A
Training:  61%|█████████████████████████

Training:  71%|█████████████████████████████            | 1065/1501 [01:25<00:32, 13.36it/s][A
Training:  71%|█████████████████████████████▏           | 1067/1501 [01:26<00:31, 13.66it/s][A
Training:  71%|█████████████████████████████▏           | 1069/1501 [01:26<00:31, 13.56it/s][A
Training:  71%|█████████████████████████████▎           | 1071/1501 [01:26<00:30, 14.10it/s][A
Training:  71%|█████████████████████████████▎           | 1073/1501 [01:26<00:30, 13.88it/s][A
Training:  72%|█████████████████████████████▎           | 1075/1501 [01:26<00:31, 13.32it/s][A
Training:  72%|█████████████████████████████▍           | 1077/1501 [01:26<00:33, 12.82it/s][A
Training:  72%|█████████████████████████████▍           | 1079/1501 [01:26<00:33, 12.64it/s][A
Training:  72%|█████████████████████████████▌           | 1081/1501 [01:27<00:31, 13.31it/s][A
Training:  72%|█████████████████████████████▌           | 1083/1501 [01:27<00:29, 14.36it/s][A
Training:  72%|█████████████████████████

Evaluation...:  41%|███████████████▉                       | 68/167 [00:02<00:03, 28.59it/s][A[A

Evaluation...:  43%|████████████████▌                      | 71/167 [00:02<00:03, 27.37it/s][A[A

Evaluation...:  44%|█████████████████▎                     | 74/167 [00:02<00:03, 27.15it/s][A[A

Evaluation...:  46%|█████████████████▉                     | 77/167 [00:02<00:03, 27.04it/s][A[A

Evaluation...:  49%|██████████████████▉                    | 81/167 [00:02<00:03, 28.58it/s][A[A

Evaluation...:  50%|███████████████████▌                   | 84/167 [00:02<00:02, 28.68it/s][A[A

Evaluation...:  52%|████████████████████▎                  | 87/167 [00:03<00:02, 27.75it/s][A[A

Evaluation...:  54%|█████████████████████▎                 | 91/167 [00:03<00:02, 29.69it/s][A[A

Evaluation...:  57%|██████████████████████▏                | 95/167 [00:03<00:02, 30.94it/s][A[A

Evaluation...:  59%|███████████████████████                | 99/167 [00:03<00:02, 32.48it/s][A[A



Training:  87%|███████████████████████████████████▊     | 1309/1501 [01:47<00:11, 16.30it/s][A
Training:  87%|███████████████████████████████████▊     | 1311/1501 [01:47<00:11, 17.05it/s][A
Training:  87%|███████████████████████████████████▊     | 1313/1501 [01:48<00:11, 16.27it/s][A
Training:  88%|███████████████████████████████████▉     | 1315/1501 [01:48<00:11, 16.21it/s][A
Training:  88%|███████████████████████████████████▉     | 1317/1501 [01:48<00:11, 16.39it/s][A
Training:  88%|████████████████████████████████████     | 1319/1501 [01:48<00:10, 16.70it/s][A
Training:  88%|████████████████████████████████████     | 1321/1501 [01:48<00:10, 16.79it/s][A
Training:  88%|████████████████████████████████████▏    | 1323/1501 [01:48<00:10, 16.63it/s][A
Training:  88%|████████████████████████████████████▏    | 1325/1501 [01:48<00:10, 16.56it/s][A
Training:  88%|████████████████████████████████████▏    | 1327/1501 [01:48<00:11, 15.76it/s][A
Training:  89%|█████████████████████████

Training:  99%|████████████████████████████████████████▍| 1479/1501 [01:58<00:01, 15.37it/s][A
Training:  99%|████████████████████████████████████████▍| 1481/1501 [01:58<00:01, 16.06it/s][A
Training:  99%|████████████████████████████████████████▌| 1483/1501 [01:58<00:01, 16.05it/s][A
Training:  99%|████████████████████████████████████████▌| 1485/1501 [01:59<00:00, 16.42it/s][A
Training:  99%|████████████████████████████████████████▌| 1487/1501 [01:59<00:00, 16.72it/s][A
Training:  99%|████████████████████████████████████████▋| 1489/1501 [01:59<00:00, 16.77it/s][A
Training:  99%|████████████████████████████████████████▋| 1491/1501 [01:59<00:00, 17.18it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:04, 37.80it/s][A[A

Evaluation...:   5%|█▉                                      | 8/167 [00:00<00:04, 36.14it/s][A[A

Evaluation...:   7%|██▊    

Training:   4%|█▋                                         | 58/1501 [00:03<01:26, 16.69it/s][A
Training:   4%|█▋                                         | 60/1501 [00:03<01:28, 16.36it/s][A
Training:   4%|█▊                                         | 62/1501 [00:03<01:27, 16.43it/s][A
Training:   4%|█▊                                         | 64/1501 [00:04<01:30, 15.81it/s][A
Training:   4%|█▉                                         | 66/1501 [00:04<01:25, 16.81it/s][A
Training:   5%|█▉                                         | 68/1501 [00:04<01:27, 16.35it/s][A
Training:   5%|██                                         | 70/1501 [00:04<01:23, 17.05it/s][A
Training:   5%|██                                         | 72/1501 [00:04<01:34, 15.09it/s][A
Training:   5%|██                                         | 74/1501 [00:04<01:48, 13.13it/s][A
Training:   5%|██▏                                        | 76/1501 [00:04<01:56, 12.23it/s][A
Training:   5%|██▏                      

Training:  15%|██████▍                                   | 228/1501 [00:14<01:15, 16.92it/s][A
Training:  15%|██████▍                                   | 230/1501 [00:14<01:14, 16.98it/s][A
Training:  15%|██████▍                                   | 232/1501 [00:14<01:15, 16.71it/s][A
Training:  16%|██████▌                                   | 234/1501 [00:14<01:35, 13.27it/s][A
Training:  16%|██████▌                                   | 236/1501 [00:15<01:39, 12.71it/s][A
Training:  16%|██████▋                                   | 238/1501 [00:15<01:38, 12.79it/s][A
Training:  16%|██████▋                                   | 240/1501 [00:15<01:37, 12.89it/s][A
Training:  16%|██████▊                                   | 242/1501 [00:15<01:44, 12.10it/s][A
Training:  16%|██████▊                                   | 244/1501 [00:15<01:36, 13.05it/s][A
Training:  16%|██████▉                                   | 246/1501 [00:15<01:33, 13.49it/s][A
Training:  17%|██████▉                  

Training:  21%|████████▊                                 | 314/1501 [00:24<01:47, 10.99it/s][A
Training:  21%|████████▊                                 | 316/1501 [00:24<01:35, 12.42it/s][A
Training:  21%|████████▉                                 | 318/1501 [00:24<01:27, 13.45it/s][A
Training:  21%|████████▉                                 | 320/1501 [00:25<01:21, 14.54it/s][A
Training:  21%|█████████                                 | 322/1501 [00:25<01:17, 15.17it/s][A
Training:  22%|█████████                                 | 324/1501 [00:25<01:15, 15.58it/s][A
Training:  22%|█████████                                 | 326/1501 [00:25<01:17, 15.22it/s][A
Training:  22%|█████████▏                                | 328/1501 [00:25<01:14, 15.80it/s][A
Training:  22%|█████████▏                                | 330/1501 [00:25<01:14, 15.71it/s][A
Training:  22%|█████████▎                                | 332/1501 [00:25<01:11, 16.31it/s][A
Training:  22%|█████████▎               

Training:  32%|█████████████▌                            | 484/1501 [00:36<00:58, 17.27it/s][A
Training:  32%|█████████████▌                            | 486/1501 [00:36<01:00, 16.78it/s][A
Training:  33%|█████████████▋                            | 488/1501 [00:36<00:58, 17.39it/s][A
Training:  33%|█████████████▋                            | 490/1501 [00:36<01:00, 16.82it/s][A
Training:  33%|█████████████▊                            | 492/1501 [00:36<00:59, 17.07it/s][A
Training:  33%|█████████████▊                            | 494/1501 [00:36<01:01, 16.35it/s][A
Training:  33%|█████████████▉                            | 496/1501 [00:37<01:00, 16.72it/s][A
Training:  33%|█████████████▉                            | 498/1501 [00:37<00:58, 17.26it/s][A
Training:  33%|█████████████▉                            | 500/1501 [00:37<00:58, 17.01it/s][A
Training:  33%|██████████████                            | 502/1501 [00:37<00:57, 17.51it/s][A
Training:  34%|██████████████           

Evaluation...:  79%|██████████████████████████████        | 132/167 [00:03<00:00, 39.81it/s][A[A

Evaluation...:  81%|██████████████████████████████▉       | 136/167 [00:03<00:00, 38.63it/s][A[A

Evaluation...:  84%|███████████████████████████████▊      | 140/167 [00:03<00:00, 37.05it/s][A[A

Evaluation...:  86%|████████████████████████████████▊     | 144/167 [00:03<00:00, 37.37it/s][A[A

Evaluation...:  89%|█████████████████████████████████▋    | 148/167 [00:03<00:00, 36.80it/s][A[A

Evaluation...:  92%|██████████████████████████████████▊   | 153/167 [00:03<00:00, 37.66it/s][A[A

Evaluation...:  94%|███████████████████████████████████▋  | 157/167 [00:04<00:00, 34.73it/s][A[A

Evaluation...:  96%|████████████████████████████████████▋ | 161/167 [00:04<00:00, 35.08it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 37.98it/s][A[A

Training:  40%|████████████████▌                         | 593/1501 [00:47<10:49,  1.40it/s][A
Trai

Training:  50%|████████████████████▊                     | 743/1501 [00:55<00:43, 17.34it/s][A
Training:  50%|████████████████████▊                     | 745/1501 [00:56<00:42, 17.63it/s][A
Training:  50%|████████████████████▉                     | 747/1501 [00:56<00:42, 17.83it/s][A
Training:  50%|████████████████████▉                     | 749/1501 [00:56<00:42, 17.67it/s][A
Training:  50%|█████████████████████                     | 751/1501 [00:56<00:42, 17.81it/s][A
Training:  50%|█████████████████████                     | 753/1501 [00:56<00:40, 18.41it/s][A
Training:  50%|█████████████████████▏                    | 755/1501 [00:56<00:39, 18.66it/s][A
Training:  50%|█████████████████████▏                    | 757/1501 [00:56<00:42, 17.62it/s][A
Training:  51%|█████████████████████▏                    | 759/1501 [00:56<00:42, 17.43it/s][A
Training:  51%|█████████████████████▎                    | 761/1501 [00:56<00:41, 17.80it/s][A
Training:  51%|█████████████████████▎   

Evaluation...:  35%|█████████████▌                         | 58/167 [00:01<00:02, 40.61it/s][A[A

Evaluation...:  38%|██████████████▋                        | 63/167 [00:01<00:02, 40.74it/s][A[A

Evaluation...:  41%|███████████████▉                       | 68/167 [00:01<00:02, 42.39it/s][A[A

Evaluation...:  44%|█████████████████                      | 73/167 [00:01<00:02, 41.01it/s][A[A

Evaluation...:  47%|██████████████████▏                    | 78/167 [00:01<00:02, 41.25it/s][A[A

Evaluation...:  50%|███████████████████▍                   | 83/167 [00:02<00:02, 41.62it/s][A[A

Evaluation...:  53%|████████████████████▌                  | 88/167 [00:02<00:02, 39.30it/s][A[A

Evaluation...:  56%|█████████████████████▋                 | 93/167 [00:02<00:01, 39.70it/s][A[A

Evaluation...:  58%|██████████████████████▋                | 97/167 [00:02<00:01, 39.15it/s][A[A

Evaluation...:  61%|███████████████████████▏              | 102/167 [00:02<00:01, 40.20it/s][A[A



Training:  68%|███████████████████████████▊             | 1018/1501 [01:15<00:25, 18.73it/s][A
Training:  68%|███████████████████████████▊             | 1020/1501 [01:15<00:25, 18.75it/s][A
Training:  68%|███████████████████████████▉             | 1022/1501 [01:15<00:25, 18.92it/s][A
Training:  68%|███████████████████████████▉             | 1024/1501 [01:15<00:25, 18.90it/s][A
Training:  68%|████████████████████████████             | 1026/1501 [01:15<00:24, 19.03it/s][A
Training:  68%|████████████████████████████             | 1028/1501 [01:15<00:24, 19.17it/s][A
Training:  69%|████████████████████████████▏            | 1030/1501 [01:16<00:25, 18.84it/s][A
Training:  69%|████████████████████████████▏            | 1032/1501 [01:16<00:25, 18.75it/s][A
Training:  69%|████████████████████████████▏            | 1034/1501 [01:16<00:25, 18.66it/s][A
Training:  69%|████████████████████████████▎            | 1036/1501 [01:16<00:24, 18.61it/s][A
Training:  69%|█████████████████████████

Evaluation...:   5%|█▉                                      | 8/167 [00:00<00:06, 25.66it/s][A[A

Evaluation...:   7%|██▌                                    | 11/167 [00:00<00:06, 23.43it/s][A[A

Evaluation...:   8%|███▎                                   | 14/167 [00:00<00:06, 24.48it/s][A[A

Evaluation...:  10%|███▉                                   | 17/167 [00:00<00:06, 23.13it/s][A[A

Evaluation...:  12%|████▋                                  | 20/167 [00:00<00:06, 22.37it/s][A[A

Evaluation...:  14%|█████▌                                 | 24/167 [00:00<00:05, 26.30it/s][A[A

Evaluation...:  16%|██████▎                                | 27/167 [00:01<00:05, 25.84it/s][A[A

Evaluation...:  19%|███████▏                               | 31/167 [00:01<00:04, 27.89it/s][A[A

Evaluation...:  20%|███████▉                               | 34/167 [00:01<00:04, 26.75it/s][A[A

Evaluation...:  22%|████████▋                              | 37/167 [00:01<00:05, 25.57it/s][A[A



Training:  85%|██████████████████████████████████▉      | 1277/1501 [01:34<00:13, 17.12it/s][A
Training:  85%|██████████████████████████████████▉      | 1279/1501 [01:34<00:13, 16.96it/s][A
Training:  85%|██████████████████████████████████▉      | 1281/1501 [01:35<00:12, 17.32it/s][A
Training:  85%|███████████████████████████████████      | 1283/1501 [01:35<00:12, 16.94it/s][A
Training:  86%|███████████████████████████████████      | 1285/1501 [01:35<00:12, 17.43it/s][A
Training:  86%|███████████████████████████████████▏     | 1287/1501 [01:35<00:12, 16.81it/s][A
Training:  86%|███████████████████████████████████▏     | 1289/1501 [01:35<00:12, 17.07it/s][A
Training:  86%|███████████████████████████████████▎     | 1291/1501 [01:35<00:12, 17.37it/s][A
Training:  86%|███████████████████████████████████▎     | 1293/1501 [01:35<00:12, 17.22it/s][A
Training:  86%|███████████████████████████████████▎     | 1295/1501 [01:35<00:12, 16.27it/s][A
Training:  86%|█████████████████████████

Training:  96%|███████████████████████████████████████▌ | 1447/1501 [01:44<00:03, 16.61it/s][A
Training:  97%|███████████████████████████████████████▌ | 1449/1501 [01:45<00:03, 15.18it/s][A
Training:  97%|███████████████████████████████████████▋ | 1451/1501 [01:45<00:03, 15.92it/s][A
Training:  97%|███████████████████████████████████████▋ | 1453/1501 [01:45<00:02, 16.47it/s][A
Training:  97%|███████████████████████████████████████▋ | 1455/1501 [01:45<00:02, 16.62it/s][A
Training:  97%|███████████████████████████████████████▊ | 1457/1501 [01:45<00:02, 17.09it/s][A
Training:  97%|███████████████████████████████████████▊ | 1459/1501 [01:45<00:02, 17.10it/s][A
Training:  97%|███████████████████████████████████████▉ | 1461/1501 [01:45<00:02, 16.14it/s][A
Training:  97%|███████████████████████████████████████▉ | 1463/1501 [01:45<00:02, 15.93it/s][A
Training:  98%|████████████████████████████████████████ | 1465/1501 [01:46<00:02, 16.45it/s][A
Training:  98%|█████████████████████████

Training:   2%|▊                                          | 30/1501 [00:01<01:26, 17.05it/s][A
Training:   2%|▉                                          | 32/1501 [00:02<01:26, 17.05it/s][A
Training:   2%|▉                                          | 34/1501 [00:02<01:26, 17.05it/s][A
Training:   2%|█                                          | 36/1501 [00:02<01:25, 17.15it/s][A
Training:   3%|█                                          | 38/1501 [00:02<01:24, 17.25it/s][A
Training:   3%|█▏                                         | 40/1501 [00:02<01:23, 17.55it/s][A
Training:   3%|█▏                                         | 42/1501 [00:02<01:23, 17.40it/s][A
Training:   3%|█▎                                         | 44/1501 [00:02<01:27, 16.62it/s][A
Training:   3%|█▎                                         | 46/1501 [00:02<01:25, 16.95it/s][A
Training:   3%|█▍                                         | 48/1501 [00:03<01:23, 17.37it/s][A
Training:   3%|█▍                       

Training:  13%|█████▌                                    | 200/1501 [00:12<01:24, 15.43it/s][A
Training:  13%|█████▋                                    | 202/1501 [00:12<01:25, 15.22it/s][A
Training:  14%|█████▋                                    | 204/1501 [00:12<01:24, 15.33it/s][A
Training:  14%|█████▊                                    | 206/1501 [00:12<01:20, 16.04it/s][A
Training:  14%|█████▊                                    | 208/1501 [00:12<01:19, 16.36it/s][A
Training:  14%|█████▉                                    | 210/1501 [00:12<01:15, 17.18it/s][A
Training:  14%|█████▉                                    | 212/1501 [00:12<01:12, 17.69it/s][A
Training:  14%|█████▉                                    | 214/1501 [00:12<01:14, 17.29it/s][A
Training:  14%|██████                                    | 216/1501 [00:13<01:15, 17.03it/s][A
Training:  15%|██████                                    | 218/1501 [00:13<01:15, 16.97it/s][A
Training:  15%|██████▏                  

Evaluation...:  88%|█████████████████████████████████▍    | 147/167 [00:04<00:00, 36.21it/s][A[A

Evaluation...:  90%|██████████████████████████████████▎   | 151/167 [00:04<00:00, 37.10it/s][A[A

Evaluation...:  93%|███████████████████████████████████▎  | 155/167 [00:04<00:00, 36.31it/s][A[A

Evaluation...:  95%|████████████████████████████████████▏ | 159/167 [00:04<00:00, 33.11it/s][A[A

Evaluation...:  98%|█████████████████████████████████████ | 163/167 [00:04<00:00, 33.96it/s][A[A

Evaluation...: 100%|██████████████████████████████████████| 167/167 [00:04<00:00, 33.46it/s][A[A

Training:  19%|████████▏                                 | 292/1501 [00:22<16:18,  1.24it/s][A
Training:  20%|████████▎                                 | 295/1501 [00:22<10:18,  1.95it/s][A
Training:  20%|████████▎                                 | 297/1501 [00:22<07:47,  2.57it/s][A
Training:  20%|████████▎                                 | 299/1501 [00:23<05:57,  3.36it/s][A
Training:  20%|█

Training:  30%|████████████▌                             | 451/1501 [00:32<01:01, 17.04it/s][A
Training:  30%|████████████▋                             | 453/1501 [00:32<01:01, 17.06it/s][A
Training:  30%|████████████▋                             | 455/1501 [00:32<01:02, 16.73it/s][A
Training:  30%|████████████▊                             | 457/1501 [00:32<01:03, 16.32it/s][A
Training:  31%|████████████▊                             | 459/1501 [00:32<01:01, 16.93it/s][A
Training:  31%|████████████▉                             | 461/1501 [00:33<01:01, 16.91it/s][A
Training:  31%|████████████▉                             | 463/1501 [00:33<01:02, 16.66it/s][A
Training:  31%|█████████████                             | 465/1501 [00:33<01:02, 16.68it/s][A
Training:  31%|█████████████                             | 467/1501 [00:33<01:01, 16.74it/s][A
Training:  31%|█████████████                             | 469/1501 [00:33<01:03, 16.21it/s][A
Training:  31%|█████████████▏           

Evaluation...:  34%|█████████████                          | 56/167 [00:01<00:03, 30.92it/s][A[A

Evaluation...:  36%|██████████████                         | 60/167 [00:01<00:03, 29.15it/s][A[A

Evaluation...:  38%|██████████████▉                        | 64/167 [00:01<00:03, 27.97it/s][A[A

Evaluation...:  40%|███████████████▋                       | 67/167 [00:02<00:03, 28.05it/s][A[A

Evaluation...:  42%|████████████████▎                      | 70/167 [00:02<00:04, 23.50it/s][A[A

Evaluation...:  44%|█████████████████                      | 73/167 [00:02<00:04, 20.78it/s][A[A

Evaluation...:  46%|█████████████████▋                     | 76/167 [00:02<00:04, 21.39it/s][A[A

Evaluation...:  47%|██████████████████▍                    | 79/167 [00:02<00:03, 22.56it/s][A[A

Evaluation...:  49%|███████████████████▏                   | 82/167 [00:02<00:03, 23.73it/s][A[A

Evaluation...:  51%|███████████████████▊                   | 85/167 [00:02<00:03, 22.50it/s][A[A



>>> training loss:  0.3611, valid loss:  2.0325

                            valid f1 score:  0.5188, valid precision score:  0.5395,
                            valid recall score:  0.5077, valid accuracy score:  0.5266



Training:  40%|████████████████▋                         | 595/1501 [00:47<07:23,  2.04it/s][A
Training:  40%|████████████████▋                         | 597/1501 [00:47<05:26,  2.77it/s][A
Training:  40%|████████████████▊                         | 599/1501 [00:47<04:03,  3.70it/s][A
Training:  40%|████████████████▊                         | 601/1501 [00:47<03:07,  4.79it/s][A
Training:  40%|████████████████▊                         | 603/1501 [00:47<02:31,  5.93it/s][A
Training:  40%|████████████████▉                         | 605/1501 [00:47<02:02,  7.29it/s][A
Training:  40%|████████████████▉                         | 607/1501 [00:48<01:42,  8.68it/s][A
Training:  41%|█████████████████                         | 609/1501 [00:48<01:29,  9.94it/s][A
Training:  41%|█████████████████                         | 611/1501 [00:48<01:21, 10.87it/s][A
Training:  41%|█████████████████▏                        | 613/1501 [00:48<01:13, 12.16it/s][A
Training:  41%|█████████████████▏      

Training:  51%|█████████████████████▍                    | 765/1501 [00:58<00:44, 16.50it/s][A
Training:  51%|█████████████████████▍                    | 767/1501 [00:58<00:43, 16.72it/s][A
Training:  51%|█████████████████████▌                    | 769/1501 [00:59<00:44, 16.52it/s][A
Training:  51%|█████████████████████▌                    | 771/1501 [00:59<00:45, 16.19it/s][A
Training:  51%|█████████████████████▋                    | 773/1501 [00:59<00:43, 16.68it/s][A
Training:  52%|█████████████████████▋                    | 775/1501 [00:59<00:42, 16.93it/s][A
Training:  52%|█████████████████████▋                    | 777/1501 [00:59<00:43, 16.68it/s][A
Training:  52%|█████████████████████▊                    | 779/1501 [00:59<00:43, 16.57it/s][A
Training:  52%|█████████████████████▊                    | 781/1501 [00:59<00:43, 16.39it/s][A
Training:  52%|█████████████████████▉                    | 783/1501 [00:59<00:44, 16.09it/s][A
Training:  52%|█████████████████████▉   

Evaluation...:  50%|███████████████████▌                   | 84/167 [00:02<00:02, 35.62it/s][A[A

Evaluation...:  53%|████████████████████▌                  | 88/167 [00:02<00:02, 33.43it/s][A[A

Evaluation...:  55%|█████████████████████▍                 | 92/167 [00:02<00:02, 34.01it/s][A[A

Evaluation...:  57%|██████████████████████▍                | 96/167 [00:02<00:02, 33.95it/s][A[A

Evaluation...:  60%|██████████████████████▊               | 100/167 [00:02<00:01, 34.44it/s][A[A

Evaluation...:  62%|███████████████████████▋              | 104/167 [00:03<00:01, 34.40it/s][A[A

Evaluation...:  65%|████████████████████████▌             | 108/167 [00:03<00:01, 35.12it/s][A[A

Evaluation...:  67%|█████████████████████████▍            | 112/167 [00:03<00:01, 35.82it/s][A[A

Evaluation...:  69%|██████████████████████████▍           | 116/167 [00:03<00:01, 35.69it/s][A[A

Evaluation...:  72%|███████████████████████████▎          | 120/167 [00:03<00:01, 34.59it/s][A[A



Training:  68%|███████████████████████████▊             | 1017/1501 [01:18<00:28, 17.28it/s][A
Training:  68%|███████████████████████████▊             | 1019/1501 [01:19<00:27, 17.82it/s][A
Training:  68%|███████████████████████████▉             | 1021/1501 [01:19<00:28, 16.65it/s][A
Training:  68%|███████████████████████████▉             | 1023/1501 [01:19<00:28, 16.77it/s][A
Training:  68%|███████████████████████████▉             | 1025/1501 [01:19<00:27, 17.21it/s][A
Training:  68%|████████████████████████████             | 1027/1501 [01:19<00:27, 17.01it/s][A
Training:  69%|████████████████████████████             | 1029/1501 [01:19<00:28, 16.54it/s][A
Training:  69%|████████████████████████████▏            | 1031/1501 [01:19<00:29, 15.99it/s][A
Training:  69%|████████████████████████████▏            | 1033/1501 [01:19<00:28, 16.34it/s][A
Training:  69%|████████████████████████████▎            | 1035/1501 [01:19<00:28, 16.52it/s][A
Training:  69%|█████████████████████████

Training:  79%|████████████████████████████████▍        | 1187/1501 [01:29<00:18, 17.15it/s][A
Training:  79%|████████████████████████████████▍        | 1189/1501 [01:29<00:17, 17.57it/s][A

Evaluation...:   0%|                                                | 0/167 [00:00<?, ?it/s][A[A

Evaluation...:   2%|▉                                       | 4/167 [00:00<00:04, 36.14it/s][A[A

Evaluation...:   5%|█▉                                      | 8/167 [00:00<00:04, 35.53it/s][A[A

Evaluation...:   7%|██▊                                    | 12/167 [00:00<00:04, 35.93it/s][A[A

Evaluation...:  10%|███▋                                   | 16/167 [00:00<00:04, 37.07it/s][A[A

Evaluation...:  12%|████▋                                  | 20/167 [00:00<00:03, 37.07it/s][A[A

Evaluation...:  14%|█████▌                                 | 24/167 [00:00<00:03, 37.67it/s][A[A

Evaluation...:  17%|██████▌                                | 28/167 [00:00<00:03, 36.62it/s][A[A

Evaluat

Training:  85%|██████████████████████████████████▋      | 1269/1501 [01:38<00:12, 18.68it/s][A
Training:  85%|██████████████████████████████████▋      | 1271/1501 [01:38<00:12, 18.16it/s][A
Training:  85%|██████████████████████████████████▊      | 1273/1501 [01:38<00:12, 17.92it/s][A
Training:  85%|██████████████████████████████████▊      | 1275/1501 [01:38<00:12, 18.13it/s][A
Training:  85%|██████████████████████████████████▉      | 1277/1501 [01:38<00:12, 18.25it/s][A
Training:  85%|██████████████████████████████████▉      | 1279/1501 [01:39<00:12, 18.19it/s][A
Training:  85%|██████████████████████████████████▉      | 1281/1501 [01:39<00:12, 17.82it/s][A
Training:  85%|███████████████████████████████████      | 1283/1501 [01:39<00:12, 18.06it/s][A
Training:  86%|███████████████████████████████████      | 1285/1501 [01:39<00:11, 18.12it/s][A
Training:  86%|███████████████████████████████████▏     | 1287/1501 [01:39<00:11, 18.41it/s][A
Training:  86%|█████████████████████████

Training:  96%|███████████████████████████████████████▎ | 1439/1501 [01:48<00:03, 17.42it/s][A
Training:  96%|███████████████████████████████████████▎ | 1441/1501 [01:48<00:03, 17.70it/s][A
Training:  96%|███████████████████████████████████████▍ | 1443/1501 [01:48<00:03, 17.91it/s][A
Training:  96%|███████████████████████████████████████▍ | 1445/1501 [01:48<00:03, 18.01it/s][A
Training:  96%|███████████████████████████████████████▌ | 1447/1501 [01:48<00:03, 17.57it/s][A
Training:  97%|███████████████████████████████████████▌ | 1449/1501 [01:48<00:02, 17.78it/s][A
Training:  97%|███████████████████████████████████████▋ | 1451/1501 [01:48<00:02, 17.15it/s][A
Training:  97%|███████████████████████████████████████▋ | 1453/1501 [01:48<00:02, 17.42it/s][A
Training:  97%|███████████████████████████████████████▋ | 1455/1501 [01:49<00:02, 17.90it/s][A
Training:  97%|███████████████████████████████████████▊ | 1457/1501 [01:49<00:02, 18.02it/s][A
Training:  97%|█████████████████████████

valid f1 score:  0.5188, valid precision score:  0.5395,
                valid recall score:  0.5077, valid accuracy score:  0.5266





## 预测并保存结果

In [31]:
def predict(config, id2label, model, test_dataloader, output_path='submission.csv'):
    """Run inference over the test set and save the predicted labels as a CSV.

    Args:
        config: Settings dict. Reads ``config['device']`` (device each batch is
            moved to) and ``config['test_file_path']`` (CSV that receives the
            extra ``label_pred`` column).
        id2label: Lookup indexed by predicted class id; the looked-up value is
            what gets written to ``label_pred``.
        model: Called as ``model(**batch)``; element ``[1]`` of its return
            value is treated as the logits and arg-maxed over the last dim.
        test_dataloader: Sized iterable of batches, each a dict whose values
            support ``.to(device)``.
        output_path: Where the resulting CSV is written. Defaults to
            ``'submission.csv'`` (the previously hard-coded location).

    Returns:
        None. The test CSV plus a ``label_pred`` column is written to
        ``output_path``.

    Raises:
        ValueError: If the number of predictions differs from the number of
            rows in the test CSV.
    """
    test_iterator = tqdm(test_dataloader, desc='Testing', total=len(test_dataloader))
    model.eval()
    test_preds = []

    # Inference only: no autograd bookkeeping is needed.
    with torch.no_grad():
        for batch in test_iterator:
            batch = {item: value.to(config['device']) for item, value in batch.items()}

            logits = model(**batch)[1]
            # Keep only the predicted class ids, moved to CPU so they can be
            # concatenated and converted to numpy afterwards.
            test_preds.append(logits.argmax(dim=-1).detach().cpu())

    test_preds = torch.cat(test_preds, dim=0).numpy()
    test_labels = [id2label[id_] for id_ in test_preds]

    test_df = pd.read_csv(config['test_file_path'], sep=',')
    # Fail with an explicit message before touching the frame; otherwise a
    # mismatch would surface as a less descriptive pandas length error.
    if len(test_labels) != len(test_df):
        raise ValueError(
            f"Got {len(test_labels)} predictions for {len(test_df)} rows in "
            f"{config['test_file_path']}"
        )
    test_df['label_pred'] = test_labels
    test_df.to_csv(output_path, index=False, encoding='utf8')

In [32]:
# Label the test set with best_model; predict() writes the result to submission.csv.
predict(config, id2label, best_model, test_dataloader)

Testing: 100%|████████████████████████████████████████████| 313/313 [00:07<00:00, 40.90it/s]


In [26]:
# Load the raw test CSV for ad-hoc inspection; predict() reads the same file on its own.
# NOTE(review): the recorded execution count (26) predates the predict cells (31/32),
# so this cell was run out of order — confirm with Restart & Run All.
test_df = pd.read_csv(config['test_file_path'], sep=',')

In [33]:
# Load the raw training CSV so its columns and labels can be inspected below.
train_df = pd.read_csv(config['train_file_path'], sep=',')

In [50]:
# Preview the first 10 training rows (recorded output shows id, label, label_desc, sentence).
train_df.head(10)

Unnamed: 0,id,label,label_desc,sentence
0,0,108,news_edu,上课时学生手机响个不停，老师一怒之下把手机摔了，家长拿发票让老师赔，大家怎么看待这种事？
1,1,104,news_finance,商赢环球股份有限公司关于延期回复上海证券交易所对公司2017年年度报告的事后审核问询函的公告
2,2,106,news_house,通过中介公司买了二手房，首付都付了，现在卖家不想卖了。怎么处理？
3,3,112,news_travel,2018年去俄罗斯看世界杯得花多少钱？
4,4,109,news_tech,剃须刀的个性革新，雷明登天猫定制版新品首发
5,5,103,news_sports,再次证明了“无敌是多么寂寞”——逆天的中国乒乓球队！
6,6,109,news_tech,三农盾SACC-全球首个推出：互联网+区块链+农产品的电商平台
7,7,116,news_game,重做or新英雄？其实重做对暴雪来说同样重要
8,8,103,news_sports,如何在商业活动中不受人欺骗？
9,9,101,news_culture,87版红楼梦最温柔的四个丫鬟，娶谁都是一生的福气


In [39]:
# Distinct raw label codes in the training set, in order of first appearance
# (the recorded output lists 15 codes between 100 and 116).
train_df['label'].unique()

array([108, 104, 106, 112, 109, 103, 116, 101, 107, 100, 102, 110, 115,
       113, 114])