### 小样本实验
数据规模：0.25k 0.5k 1k 1.35k  
抽样方式：随机抽样，设置统一的随机种子（seed=2021）   
结果：每个模型训练3次，取最好的一次作为结果

#### 数据构造

In [None]:
# Create the root directory that will hold the few-shot data samples.
import os

path = "data/few_shot"
# exist_ok=True makes the call idempotent and removes the check-then-create
# race of a separate os.path.exists() test.
os.makedirs(path, exist_ok=True)
print("done!")

##### 微博数据

In [None]:
# Copy the Weibo data files into the few-shot working directory.
from shutil import copyfile
import os

data = ["train.json","dev.json","test.json","labels.txt"]

# exist_ok=True: idempotent, and no race between the existence check and
# the directory creation.
os.makedirs("data/few_shot/weibo", exist_ok=True)
for f in data:
    copyfile(f"data/weibo/{f}",f"data/few_shot/weibo/{f}")

In [None]:
# Draw fixed-size random subsets of the Weibo training set.
postfix = [250,500,1000,1350]

# A fixed random seed is used below so the subsets are reproducible.
import random

# Load the original training set (one JSON object per line).
train_file = "data/few_shot/weibo/train.json"
train_data = []

from tqdm import tqdm
import json

with open(train_file,"r",encoding="utf-8") as reader:
    for line in tqdm(reader,desc=f"load {train_file}"):
        line = line.strip()
        if not line:
            # Tolerate blank lines (e.g. a trailing newline) instead of
            # crashing inside json.loads.
            continue
        record = json.loads(line)
        text,label = record["text"],record["label"]
        # Every record must carry exactly one label per text position.
        assert len(text)==len(label)
        if len(text)>0:
            train_data.append(record)
        else:
            # Empty samples are reported and left out of the sampling pool.
            print(text,label)

# Write one sampled training file per requested size.
for post in postfix:
    # Re-seed before every draw so each file is reproducible on its own.
    random.seed(2021)
    sampled = random.sample(train_data,post)
    assert len(sampled)==post
    # Leaving the with-block flushes and closes the file, so no explicit
    # flush is needed.
    with open(f"data/few_shot/weibo/train_{post}.json","w",encoding="utf-8") as f:
        for record in tqdm(sampled,desc=f"{post}"):
            f.write(f"{json.dumps(record,ensure_ascii=False)}\n")

##### Ontonotes4 数据

In [None]:
# Copy the Ontonotes4 data files into the few-shot working directory.
from shutil import copyfile
import os

data = ["train.json","dev.json","test.json","labels.txt"]

# exist_ok=True: idempotent, and no race between the existence check and
# the directory creation.
os.makedirs("data/few_shot/note4", exist_ok=True)
for f in data:
    copyfile(f"data/lebert/dataset/NER/note4/{f}",f"data/few_shot/note4/{f}")

In [None]:
# Draw fixed-size random subsets of the Ontonotes4 training set.
postfix = [250,500,1000,1350]

# A fixed random seed is used below so the subsets are reproducible.
import random

# Load the original training set (one JSON object per line).
train_file = "data/few_shot/note4/train.json"
train_data = []

from tqdm import tqdm
import json

with open(train_file,"r",encoding="utf-8") as reader:
    for line in tqdm(reader,desc=f"load {train_file}"):
        line = line.strip()
        if not line:
            # Tolerate blank lines (e.g. a trailing newline) instead of
            # crashing inside json.loads.
            continue
        record = json.loads(line)
        text,label = record["text"],record["label"]
        # Every record must carry exactly one label per text position.
        assert len(text)==len(label)
        if len(text)>0:
            train_data.append(record)
        else:
            # Empty samples are reported and left out of the sampling pool.
            print(text,label)

# Write one sampled training file per requested size.
for post in postfix:
    # Re-seed before every draw so each file is reproducible on its own.
    random.seed(2021)
    sampled = random.sample(train_data,post)
    assert len(sampled)==post
    # Leaving the with-block flushes and closes the file, so no explicit
    # flush is needed.
    with open(f"data/few_shot/note4/train_{post}.json","w",encoding="utf-8") as f:
        for record in tqdm(sampled,desc=f"{post}"):
            f.write(f"{json.dumps(record,ensure_ascii=False)}\n")

##### MSRA 数据

In [None]:
# Copy the MSRA data files into the few-shot working directory.
from shutil import copyfile
import os

data = ["train.json","dev.json","test.json","labels.txt"]

# exist_ok=True: idempotent, and no race between the existence check and
# the directory creation.
os.makedirs("data/few_shot/msra", exist_ok=True)
for f in data:
    copyfile(f"data/lebert/dataset/NER/msra/{f}",f"data/few_shot/msra/{f}")

In [None]:
# Draw fixed-size random subsets of the MSRA training set.
postfix = [250,500,1000,1350]

# A fixed random seed is used below so the subsets are reproducible.
import random

# Load the original training set (one JSON object per line).
train_file = "data/few_shot/msra/train.json"
train_data = []

from tqdm import tqdm
import json

with open(train_file,"r",encoding="utf-8") as reader:
    for line in tqdm(reader,desc=f"load {train_file}"):
        line = line.strip()
        if not line:
            # Tolerate blank lines (e.g. a trailing newline) instead of
            # crashing inside json.loads.
            continue
        record = json.loads(line)
        text,label = record["text"],record["label"]
        # Every record must carry exactly one label per text position.
        assert len(text)==len(label)
        if len(text)>0:
            train_data.append(record)
        else:
            # Empty samples are reported and left out of the sampling pool.
            print(text,label)

# Write one sampled training file per requested size.
for post in postfix:
    # Re-seed before every draw so each file is reproducible on its own.
    random.seed(2021)
    sampled = random.sample(train_data,post)
    assert len(sampled)==post
    # Leaving the with-block flushes and closes the file, so no explicit
    # flush is needed.
    with open(f"data/few_shot/msra/train_{post}.json","w",encoding="utf-8") as f:
        for record in tqdm(sampled,desc=f"{post}"):
            f.write(f"{json.dumps(record,ensure_ascii=False)}\n")

##### Resume数据

In [None]:
# Copy the Resume data files into the few-shot working directory.
from shutil import copyfile
import os

data = ["train.json","dev.json","test.json","labels.txt"]

# exist_ok=True: idempotent, and no race between the existence check and
# the directory creation.
os.makedirs("data/few_shot/resume", exist_ok=True)
for f in data:
    copyfile(f"data/lebert/dataset/NER/resume/{f}",f"data/few_shot/resume/{f}")

In [None]:
# Draw fixed-size random subsets of the Resume training set.
postfix = [250,500,1000,1350]

# A fixed random seed is used below so the subsets are reproducible.
import random

# Load the original training set (one JSON object per line).
train_file = "data/few_shot/resume/train.json"
train_data = []

from tqdm import tqdm
import json

with open(train_file,"r",encoding="utf-8") as reader:
    for line in tqdm(reader,desc=f"load {train_file}"):
        line = line.strip()
        if not line:
            # Tolerate blank lines (e.g. a trailing newline) instead of
            # crashing inside json.loads.
            continue
        record = json.loads(line)
        text,label = record["text"],record["label"]
        # Every record must carry exactly one label per text position.
        assert len(text)==len(label)
        if len(text)>0:
            train_data.append(record)
        else:
            # Empty samples are reported and left out of the sampling pool.
            print(text,label)

# Write one sampled training file per requested size.
for post in postfix:
    # Re-seed before every draw so each file is reproducible on its own.
    random.seed(2021)
    sampled = random.sample(train_data,post)
    assert len(sampled)==post
    # Leaving the with-block flushes and closes the file, so no explicit
    # flush is needed.
    with open(f"data/few_shot/resume/train_{post}.json","w",encoding="utf-8") as f:
        for record in tqdm(sampled,desc=f"{post}"):
            f.write(f"{json.dumps(record,ensure_ascii=False)}\n")

#### Bert+LSTM+CRF(Baseline)

In [None]:
# Base keyword arguments for the Bert baseline trainer.
# The file paths and task name below are the weibo/250 defaults; the training
# cell overwrites train_file/eval_file/test_file/tag_file/task_name per run.
model_args = {
    # "model_name" used to be listed twice in this literal (same value both
    # times); a repeated key silently overrides the earlier one, so it is
    # declared exactly once here.
    "model_name":"Bert",
    # NOTE(review): both "loader" and "loader_name" are passed with the same
    # value — confirm which spelling the trainer actually reads.
    "loader":"cn_loader",
    'num_epochs': 30,
    'num_gpus': [0, 1, 2, 3],
    'hidden_dim': 512,
    'bert_config_file_name': './model/chinese_wwm_ext/config.json',
    'pretrained_file_name': './model/chinese_wwm_ext/pytorch_model.bin',
    'max_seq_length': 150,
    'max_scan_num': 1000000,
    'train_file': 'data/few_shot/weibo/train_250.json',
    'eval_file': 'data/few_shot/weibo/dev.json',
    'test_file': 'data/few_shot/weibo/test.json',
    'bert_vocab_file': './model/chinese_wwm_ext/vocab.txt',
    'tag_file': 'data/few_shot/weibo/labels.txt',
    'loader_name': 'cn_loader',
    'batch_size': 8,
    'eval_batch_size': 64,
    'do_shuffle': True,
    'use_json': True,
    'output_eval': True,
    'task_name': 'weibo_bert_crf_250_x3',
    "use_gpu": True,
    "debug": True,
}

In [None]:
from CC.trainer import NERTrainer
import torch

# Number of repeated training runs per (dataset, train size) pair.
per_task_count = 3

datasets = ["weibo","note4","msra","resume"]

task_trainset = [250,500,1000,1350]

# Per-run overrides for model_args. Placeholders are filled positionally with
# (dataset name, train size, run tag); templates with fewer placeholders
# simply ignore the extra arguments.
tasks_args = {
        "train_file":"data/few_shot/{}/train_{}.json",
        "eval_file":"data/few_shot/{}/dev.json",
        "test_file":"data/few_shot/{}/test.json",
        'tag_file':"data/few_shot/{}/labels.txt",
        "task_name":"{}_bert_crf_{}_{}",
}

for name in datasets:
    for trainset in task_trainset:
        for i in range(per_task_count):
            run_tag = f"x{i+1}"
            # Overwrite the run-specific entries of the shared model_args in place.
            model_args.update(
                (key, template.format(name, trainset, run_tag))
                for key, template in tasks_args.items()
            )
            trainer = NERTrainer(**model_args)

            # train() is consumed as an iterable; the yielded items are ignored.
            for _ in trainer.train():
                pass

            # Release cached GPU memory before the next run.
            torch.cuda.empty_cache()


#### LEBert+LSTM+CRF

In [None]:
# Base keyword arguments for the LEBert trainer. The file paths and task name
# are the weibo/250 defaults; the training cell overwrites them per run.
model_args = dict(
    loader="le_loader",
    num_epochs=30,
    num_gpus=[0, 1, 2, 3],
    hidden_dim=512,
    bert_config_file_name='./model/chinese_wwm_ext/config.json',
    pretrained_file_name='./model/chinese_wwm_ext/pytorch_model.bin',
    max_seq_length=150,
    max_scan_num=1000000,
    train_file='data/few_shot/weibo/train_250.json',
    eval_file='data/few_shot/weibo/dev.json',
    test_file='data/few_shot/weibo/test.json',
    bert_vocab_file='./model/chinese_wwm_ext/vocab.txt',
    word_embedding_file='data/tencent/word_embedding.txt',
    tag_file='data/few_shot/weibo/labels.txt',
    word_vocab_file='data/tencent/tencent_vocab.txt',
    loader_name='le_loader',
    batch_size=8,
    eval_batch_size=64,
    do_shuffle=True,
    use_json=True,
    model_name='LEBert',
    output_eval=True,
    task_name='weibo_lebert_crf_250_x3',
    use_gpu=True,
    debug=True,
)

In [None]:
from CC.trainer import NERTrainer
import torch

# Number of repeated training runs per (dataset, train size) pair.
per_task_count = 3

datasets = ["weibo","note4","msra","resume"]

task_trainset = [250,500,1000,1350]

# Per-run overrides for model_args. Placeholders are filled positionally with
# (dataset name, train size, run tag); templates with fewer placeholders
# simply ignore the extra arguments.
tasks_args = {
        "train_file":"data/few_shot/{}/train_{}.json",
        "eval_file":"data/few_shot/{}/dev.json",
        "test_file":"data/few_shot/{}/test.json",
        'tag_file':"data/few_shot/{}/labels.txt",
        "task_name":"{}_lebert_crf_{}_{}"
}

for name in datasets:
    for trainset in task_trainset:
        for i in range(per_task_count):
            run_tag = f"x{i+1}"
            # Overwrite the run-specific entries of the shared model_args in place.
            model_args.update(
                (key, template.format(name, trainset, run_tag))
                for key, template in tasks_args.items()
            )
            trainer = NERTrainer(**model_args)

            # train() is consumed as an iterable; the yielded items are ignored.
            for _ in trainer.train():
                pass

            # Release cached GPU memory before the next run.
            torch.cuda.empty_cache()



#### Prompts PreTrain+LeBert FineTune

##### PreTrainer

In [None]:
# weibo: run the pre-training stage once per few-shot training-set size.
from CC.pre_trained import NERPreTrainer
import torch

# Keyword arguments for NERPreTrainer; train_file and task_name are the
# 250-sample defaults and are overwritten inside the loop below.
pretrain_model_args = dict(
    num_epochs=30,
    num_gpus=[0, 1, 2, 3],
    bert_config_file_name='./model/chinese_wwm_ext/config.json',
    pretrained_file_name='./model/chinese_wwm_ext/pytorch_model.bin',
    max_seq_length=512,
    max_scan_num=1000000,
    train_file='data/few_shot/weibo/train_250.json',
    eval_file='data/few_shot/weibo/dev.json',
    test_file='data/few_shot/weibo/test.json',
    bert_vocab_file='./model/chinese_wwm_ext/vocab.txt',
    tag_file='data/few_shot/weibo/labels.txt',
    loader_name='lex_loader',
    word_embedding_file="./data/tencent/word_embedding.txt",
    word_vocab_file="./data/tencent/tencent_vocab.txt",
    word_vocab_file_with_tag="./data/tencent/tencent_vocab_with_tag.json",
    default_tag="O",
    batch_size=32,
    eval_batch_size=64,
    do_shuffle=True,
    task_name='weibo_pretrain_lebert_250_pretraind_task',
    use_gpu=True,
    debug=True,
    # Maps each tag name to a Chinese description string.
    tag_rules={
        "O":"非实体",
        "PER.NOM": "指代人名",
        "LOC.NAM": "地名",
        "PER.NAM": "人名",
        "GPE.NAM": "政体",
        "ORG.NAM": "机构",
        "ORG.NOM": "指代机构",
        "LOC.NOM": "指代地名",
        "GPE.NOM": "指代政体",
        "ORG": "组织",
        "LOC": "地点",
        "PER": "人",
        "Time": "时间",
        "Thing": "物品",
        "Metric": "测量单位",
        "Abstract": "作品",
        "Physical": "实体",
        "Term": "术语",
        "company": "企业",
        "name": "名字",
        "game": "游戏",
        "movie": "电影",
        "position": "职位",
        "address": "地址",
        "government": "政府",
        "scene": "景点",
        "book": "书名"
    },
)

trainsets = [250,500,1000,1350]

for train in trainsets:
    # Point this run at the matching sampled training file and task name.
    pretrain_model_args.update(
        train_file=f'data/few_shot/weibo/train_{train}.json',
        task_name=f'weibo_pretrain_lebert_{train}_pretraind_task',
    )

    pre_trainer = NERPreTrainer(**pretrain_model_args)

    # Calling the pre-trainer returns an iterable that is drained here;
    # `a` ends up holding the last yielded item.
    for i in pre_trainer():
        a = i

    # Release cached GPU memory before the next run.
    torch.cuda.empty_cache()

In [None]:
# note4: run the pre-training stage once per few-shot training-set size.
from CC.pre_trained import NERPreTrainer
import torch

# Keyword arguments for NERPreTrainer; train_file and task_name are the
# 250-sample defaults and are overwritten inside the loop below.
pretrain_model_args = dict(
    num_epochs=30,
    num_gpus=[0, 1, 2, 3],
    bert_config_file_name='./model/chinese_wwm_ext/config.json',
    pretrained_file_name='./model/chinese_wwm_ext/pytorch_model.bin',
    max_seq_length=512,
    max_scan_num=1000000,
    train_file='data/few_shot/note4/train_250.json',
    eval_file='data/few_shot/note4/dev.json',
    test_file='data/few_shot/note4/test.json',
    bert_vocab_file='./model/chinese_wwm_ext/vocab.txt',
    tag_file='data/few_shot/note4/labels.txt',
    loader_name='lex_loader',
    word_embedding_file="./data/tencent/word_embedding.txt",
    word_vocab_file="./data/tencent/tencent_vocab.txt",
    word_vocab_file_with_tag="./data/tencent/tencent_vocab_with_tag.json",
    default_tag="O",
    batch_size=32,
    eval_batch_size=64,
    do_shuffle=True,
    task_name='note4_pretrain_lebert_250_pretraind_task',
    use_gpu=True,
    debug=True,
    # Maps each tag name to a Chinese description string.
    tag_rules={
        "O":"非实体",
        "ORG": "组织",
        "LOC": "地点",
        "PER": "人",
        "GPE": "政治",
        "Time": "时间",
        "Thing": "物品",
        "Metric": "测量单位",
        "Abstract": "作品",
        "Physical": "实体",
        "Term": "术语",
        "company": "企业",
        "name": "名字",
        "game": "游戏",
        "movie": "电影",
        "position": "职位",
        "address": "地址",
        "government": "政府",
        "scene": "景点",
        "book": "书名"
    },
)

trainsets = [250,500,1000,1350]

for train in trainsets:
    # Point this run at the matching sampled training file and task name.
    pretrain_model_args.update(
        train_file=f'data/few_shot/note4/train_{train}.json',
        task_name=f'note4_pretrain_lebert_{train}_pretraind_task',
    )

    pre_trainer = NERPreTrainer(**pretrain_model_args)

    # Calling the pre-trainer returns an iterable that is drained here;
    # `a` ends up holding the last yielded item.
    for i in pre_trainer():
        a = i

    # Release cached GPU memory before the next run.
    torch.cuda.empty_cache()

In [None]:
# msra: run the pre-training stage once per few-shot training-set size.
from CC.pre_trained import NERPreTrainer
import torch

# Keyword arguments for NERPreTrainer; train_file and task_name are the
# 250-sample defaults and are overwritten inside the loop below.
pretrain_model_args = dict(
    num_epochs=30,
    num_gpus=[0, 1, 2, 3],
    bert_config_file_name='./model/chinese_wwm_ext/config.json',
    pretrained_file_name='./model/chinese_wwm_ext/pytorch_model.bin',
    max_seq_length=512,
    max_scan_num=1000000,
    train_file='data/few_shot/msra/train_250.json',
    eval_file='data/few_shot/msra/dev.json',
    test_file='data/few_shot/msra/test.json',
    bert_vocab_file='./model/chinese_wwm_ext/vocab.txt',
    tag_file='data/few_shot/msra/labels.txt',
    loader_name='lex_loader',
    word_embedding_file="./data/tencent/word_embedding.txt",
    word_vocab_file="./data/tencent/tencent_vocab.txt",
    word_vocab_file_with_tag="./data/tencent/tencent_vocab_with_tag.json",
    default_tag="O",
    batch_size=32,
    eval_batch_size=64,
    do_shuffle=True,
    task_name='msra_pretrain_lebert_250_pretraind_task',
    use_gpu=True,
    debug=True,
    # Maps each tag name to a Chinese description string.
    tag_rules={
        "O":"非实体",
        "NS":"地名",
        "NR":"人名",
        "NT":"机构团体",
        "ORG": "组织",
        "LOC": "地点",
        "PER": "人",
        "Time": "时间",
        "Thing": "物品",
        "Metric": "测量单位",
        "Abstract": "作品",
        "Physical": "实体",
        "Term": "术语",
        "company": "企业",
        "name": "名字",
        "game": "游戏",
        "movie": "电影",
        "position": "职位",
        "address": "地址",
        "government": "政府",
        "scene": "景点",
        "book": "书名"
    },
)

trainsets = [250,500,1000,1350]

for train in trainsets:
    # Point this run at the matching sampled training file and task name.
    pretrain_model_args.update(
        train_file=f'data/few_shot/msra/train_{train}.json',
        task_name=f'msra_pretrain_lebert_{train}_pretraind_task',
    )

    pre_trainer = NERPreTrainer(**pretrain_model_args)

    # Calling the pre-trainer returns an iterable that is drained here;
    # `a` ends up holding the last yielded item.
    for i in pre_trainer():
        a = i

    # Release cached GPU memory before the next run.
    torch.cuda.empty_cache()

In [None]:
# resume: run the pre-training stage once per few-shot training-set size.
from CC.pre_trained import NERPreTrainer
import torch

# Keyword arguments for NERPreTrainer; train_file and task_name are the
# 250-sample defaults and are overwritten inside the loop below.
pretrain_model_args = dict(
    num_epochs=30,
    num_gpus=[0, 1, 2, 3],
    bert_config_file_name='./model/chinese_wwm_ext/config.json',
    pretrained_file_name='./model/chinese_wwm_ext/pytorch_model.bin',
    max_seq_length=512,
    max_scan_num=1000000,
    train_file='data/few_shot/resume/train_250.json',
    eval_file='data/few_shot/resume/dev.json',
    test_file='data/few_shot/resume/test.json',
    bert_vocab_file='./model/chinese_wwm_ext/vocab.txt',
    tag_file='data/few_shot/resume/labels.txt',
    loader_name='lex_loader',
    word_embedding_file="./data/tencent/word_embedding.txt",
    word_vocab_file="./data/tencent/tencent_vocab.txt",
    word_vocab_file_with_tag="./data/tencent/tencent_vocab_with_tag.json",
    default_tag="O",
    batch_size=32,
    eval_batch_size=64,
    do_shuffle=True,
    task_name='resume_pretrain_lebert_250_pretraind_task',
    use_gpu=True,
    debug=True,
    # Maps each tag name to a Chinese description string.
    tag_rules={
        "O":"非实体",
        "NAME":"名字",
        "CONT":"国家",
        "RACE":"种族背景",
        "TITLE":"职位",
        "EDU":"教育机构",
        "PRO":"专业",
        "ORG": "组织",
        "LOC": "地点",
        "PER": "人",
        "Time": "时间",
        "Thing": "物品",
        "Metric": "测量单位",
        "Abstract": "作品",
        "Physical": "实体",
        "Term": "术语",
        "company": "企业",
        "name": "名字",
        "game": "游戏",
        "movie": "电影",
        "position": "职位",
        "address": "地址",
        "government": "政府",
        "scene": "景点",
        "book": "书名"
    },
)

trainsets = [250,500,1000,1350]

for train in trainsets:
    # Point this run at the matching sampled training file and task name.
    pretrain_model_args.update(
        train_file=f'data/few_shot/resume/train_{train}.json',
        task_name=f'resume_pretrain_lebert_{train}_pretraind_task',
    )

    pre_trainer = NERPreTrainer(**pretrain_model_args)

    # Calling the pre-trainer returns an iterable that is drained here;
    # `a` ends up holding the last yielded item.
    for i in pre_trainer():
        a = i

    # Release cached GPU memory before the next run.
    torch.cuda.empty_cache()

In [2]:
# Base keyword arguments for fine-tuning LEBert. The file paths, task name and
# pretrained_file_name are defaults that the training cell overwrites per run.
model_args = dict(
    loader="le_loader",
    num_epochs=30,
    num_gpus=[0, 1, 2, 3],
    hidden_dim=512,
    bert_config_file_name='./model/chinese_wwm_ext/config.json',
    pretrained_file_name='./model/chinese_wwm_ext/pytorch_model.bin',
    max_seq_length=150,
    max_scan_num=1000000,
    train_file='data/few_shot/weibo/train_250.json',
    eval_file='data/few_shot/weibo/dev.json',
    test_file='data/few_shot/weibo/test.json',
    bert_vocab_file='./model/chinese_wwm_ext/vocab.txt',
    word_embedding_file='data/tencent/word_embedding.txt',
    tag_file='data/few_shot/weibo/labels.txt',
    word_vocab_file='data/tencent/tencent_vocab.txt',
    loader_name='le_loader',
    batch_size=8,
    eval_batch_size=64,
    do_shuffle=True,
    use_json=True,
    model_name='LEBert',
    output_eval=True,
    task_name='weibo_lebert_crf_250_x3',
    use_gpu=True,
    debug=True,
)

In [4]:
from CC.trainer import NERTrainer
import torch

# Number of repeated fine-tuning runs per (dataset, train size) pair.
per_task_count = 3

datasets = ["weibo","note4","msra","resume"]

task_trainset = [250,500,1000,1350]

# Suffix of the pre-trained checkpoint directory (Bert_<n>), paired
# positionally with task_trainset.
# NOTE(review): presumably the final pre-training step count — confirm.
pretrain = [240,480,960,1290]

# Placeholders: {0}=dataset, {1}=train size, {2}=run tag, {3}=checkpoint suffix.
tasks_args = {
        'pretrained_file_name': 'save_pretrained/{0}_pretrain_lebert_{1}_pretraind_task/Bert_{3}/pytorch_model.bin',
        "train_file":"data/few_shot/{0}/train_{1}.json",
        "eval_file":"data/few_shot/{0}/dev.json",
        "test_file":"data/few_shot/{0}/test.json",
        'tag_file':"data/few_shot/{0}/labels.txt",
        "task_name":"{0}_pretrain_lebert_crf_{1}_{2}"
}

for name in datasets:
    for trainset,pre in zip(task_trainset,pretrain):
        for i in range(per_task_count):
            fill = (name, trainset, f"x{i+1}", pre)
            # Overwrite the run-specific entries of the shared model_args in place.
            model_args.update(
                (key, template.format(*fill))
                for key, template in tasks_args.items()
            )
            trainer = NERTrainer(**model_args)

            # train() is consumed as an iterable; the yielded items are ignored.
            for _ in trainer.train():
                pass

            # Release cached GPU memory before the next run.
            torch.cuda.empty_cache()



calculate data/few_shot/weibo/train_250.json etag: 100%|██████████| 170k/170k [00:00<00:00, 174MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 191MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 178MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 467kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_250.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/weibo/test.json",
    "tag_file": "data/few_shot/weibo/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "weibo_pretrain_lebert_crf_250_x1"
}
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree



count line size data/few_shot/weibo/labels.txt: 29L [00:00, 201716.11L/s]
build line mapper: 29L [00:00, 214902.50L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8029.76it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 247764.79it/s]
load dataset from data/few_shot/weibo/train_250.json: 0it [00:00, ?it/s]

load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_250.json: 250it [00:00, 375.38it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 442.05it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fr

Load pretrained embedding from file.........


  _warn_prf(average, modifier, msg_start, len(result))
Epoch: 1/30 Train: 100%|██████████| 32/32 [00:19<00:00,  1.63it/s, F1=0, train_acc=0.419, train_loss=93.9, train_precision=0, train_recall=0]
  _warn_prf(average, modifier, msg_start, len(result))


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.22it/s, F1=0, eval_acc=0.933, eval_loss=26.4, eval_precision=0, eval_recall=0]
  _warn_prf(average, modifier, msg_start, len(result))


eval_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.11it/s, F1=0, train_acc=0.926, train_loss=29.8, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.18it/s, F1=0, eval_acc=0.933, eval_loss=22.2, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.21it/s, F1=0, train_acc=0.924, train_loss=23.5, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0, eval_acc=0.933, eval_loss=18.3, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(
Epoch: 4/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.31it/s, F1=0, train_acc=0.931, train_loss=18.6, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.10it/s, F1=0, eval_acc=0.932, eval_loss=13.6, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.38it/s, F1=0.0477, train_acc=0.935, train_loss=14.2, train_precision=0.0637, train_recall=0.043]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.11      0.11      0.11       105
     PER.NOM       0.02      0.01      0.01       141

   micro avg       0.04      0.04      0.04       381
   macro avg       0.02      0.02      0.02       381
weighted avg       0.04      0.04      0.04       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.121, eval_acc=0.944, eval_loss=10.3, eval_precision=0.0924, eval_recall=0.178]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.01      0.02      0.02        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.16      0.40      0.23        90
     PER.NOM       0.05      0.11      0.07       208

   micro avg       0.08      0.15      0.10       389
   macro avg       0.03      0.07      0.04       389
weighted avg       0.07      0.15      0.09       389



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.25it/s, F1=0.289, train_acc=0.955, train_loss=8.97, train_precision=0.278, train_recall=0.316]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.09      0.12      0.10        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.05      0.09      0.06        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.39      0.55      0.46       105
     PER.NOM       0.29      0.37      0.32       141

   micro avg       0.25      0.31      0.28       381
   macro avg       0.10      0.14      0.12       381
weighted avg       0.23      0.31      0.27       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.434, eval_acc=0.956, eval_loss=7.65, eval_precision=0.344, eval_recall=0.601]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.18      0.42      0.25        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.07      0.21      0.11        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.44      0.58      0.50        90
     PER.NOM       0.48      0.71      0.57       208

   micro avg       0.35      0.57      0.43       389
   macro avg       0.15      0.24      0.18       389
weighted avg       0.38      0.57      0.45       389



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.29it/s, F1=0.585, train_acc=0.973, train_loss=6.17, train_precision=0.563, train_recall=0.633]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.41      0.70      0.51        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.18      0.35      0.24        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.70      0.70      0.70       105
     PER.NOM       0.67      0.80      0.73       141

   micro avg       0.51      0.62      0.56       381
   macro avg       0.24      0.32      0.27       381
weighted avg       0.51      0.62      0.56       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.545, eval_acc=0.963, eval_loss=6.71, eval_precision=0.439, eval_recall=0.724]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.43      0.77      0.55        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.12      0.34      0.17        47
     ORG.NOM       1.00      0.80      0.89         5
     PER.NAM       0.48      0.76      0.58        90
     PER.NOM       0.58      0.78      0.67       208

   micro avg       0.44      0.70      0.54       389
   macro avg       0.32      0.43      0.36       389
weighted avg       0.48      0.70      0.56       389



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.20it/s, F1=0.681, train_acc=0.98, train_loss=4.72, train_precision=0.656, train_recall=0.729] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.50      0.72      0.59        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.13      0.17      0.15        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.49      0.73      0.59        55
     ORG.NOM       0.50      0.20      0.29        10
     PER.NAM       0.74      0.80      0.77       105
     PER.NOM       0.76      0.83      0.79       141

   micro avg       0.63      0.72      0.68       381
   macro avg       0.39      0.43      0.40       381
weighted avg       0.63      0.72      0.67       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.556, eval_acc=0.962, eval_loss=6.58, eval_precision=0.499, eval_recall=0.642]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.46      0.69      0.55        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.22      0.36      0.27        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.62      0.67      0.64        90
     PER.NOM       0.63      0.69      0.66       208

   micro avg       0.52      0.62      0.57       389
   macro avg       0.32      0.40      0.36       389
weighted avg       0.54      0.62      0.58       389



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.25it/s, F1=0.736, train_acc=0.986, train_loss=2.92, train_precision=0.723, train_recall=0.757]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.27      0.33      0.30        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.64      0.85      0.73        55
     ORG.NOM       0.67      0.60      0.63        10
     PER.NAM       0.81      0.85      0.83       105
     PER.NOM       0.79      0.84      0.81       141

   micro avg       0.71      0.78      0.74       381
   macro avg       0.47      0.53      0.50       381
weighted avg       0.70      0.78      0.74       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.20it/s, F1=0.571, eval_acc=0.958, eval_loss=6.93, eval_precision=0.475, eval_recall=0.732]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.53      0.77      0.62        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.04      0.17      0.07         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.22      0.30      0.25        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.47      0.77      0.58        90
     PER.NOM       0.63      0.83      0.71       208

   micro avg       0.50      0.72      0.59       389
   macro avg       0.28      0.45      0.34       389
weighted avg       0.51      0.72      0.60       389



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.29it/s, F1=0.814, train_acc=0.99, train_loss=1.95, train_precision=0.8, train_recall=0.837]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.74      0.86      0.80        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.27      0.50      0.35        12
     LOC.NOM       0.50      0.23      0.32        13
     ORG.NAM       0.73      0.85      0.79        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.84      0.89      0.86       105
     PER.NOM       0.91      0.92      0.92       141

   micro avg       0.80      0.85      0.82       381
   macro avg       0.60      0.64      0.61       381
weighted avg       0.80      0.85      0.82       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.615, eval_acc=0.967, eval_loss=6.06, eval_precision=0.563, eval_recall=0.685]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.69      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.27      0.47      0.34        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.61      0.76      0.67        90
     PER.NOM       0.73      0.72      0.72       208

   micro avg       0.58      0.67      0.62       389
   macro avg       0.36      0.43      0.39       389
weighted avg       0.61      0.67      0.64       389



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.17it/s, F1=0.869, train_acc=0.994, train_loss=1.34, train_precision=0.865, train_recall=0.881]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.88      0.88      0.88        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.31      0.42      0.36        12
     LOC.NOM       0.47      0.69      0.56        13
     ORG.NAM       0.83      0.95      0.88        55
     ORG.NOM       0.67      0.80      0.73        10
     PER.NAM       0.92      0.92      0.92       105
     PER.NOM       0.96      0.96      0.96       141

   micro avg       0.86      0.90      0.88       381
   macro avg       0.63      0.70      0.66       381
weighted avg       0.87      0.90      0.88       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.58, eval_acc=0.963, eval_loss=6.79, eval_precision=0.5, eval_recall=0.704]   


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.77      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.09      0.50      0.16         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.24      0.36      0.29        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.55      0.77      0.64        90
     PER.NOM       0.69      0.77      0.73       208

   micro avg       0.53      0.70      0.61       389
   macro avg       0.31      0.50      0.37       389
weighted avg       0.57      0.70      0.63       389



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.21it/s, F1=0.94, train_acc=0.996, train_loss=0.974, train_precision=0.933, train_recall=0.949] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.93      0.91        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.60      0.75      0.67        12
     LOC.NOM       0.57      0.62      0.59        13
     ORG.NAM       0.96      0.96      0.96        55
     ORG.NOM       0.75      0.90      0.82        10
     PER.NAM       0.93      0.97      0.95       105
     PER.NOM       0.96      0.97      0.97       141

   micro avg       0.91      0.94      0.93       381
   macro avg       0.71      0.76      0.73       381
weighted avg       0.91      0.94      0.92       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.622, eval_acc=0.965, eval_loss=6.82, eval_precision=0.572, eval_recall=0.689]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.77      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.18      0.67      0.29         6
     LOC.NOM       0.60      0.50      0.55         6
     ORG.NAM       0.30      0.40      0.35        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.64      0.69      0.66        90
     PER.NOM       0.71      0.74      0.72       208

   micro avg       0.60      0.68      0.64       389
   macro avg       0.46      0.57      0.49       389
weighted avg       0.63      0.68      0.65       389



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.23it/s, F1=0.907, train_acc=0.996, train_loss=0.838, train_precision=0.912, train_recall=0.904]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.91      0.91      0.91        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.71      0.83      0.77        12
     LOC.NOM       0.57      0.62      0.59        13
     ORG.NAM       0.96      0.98      0.97        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.98      0.96      0.97       105
     PER.NOM       0.99      0.97      0.98       141

   micro avg       0.94      0.94      0.94       381
   macro avg       0.74      0.77      0.76       381
weighted avg       0.94      0.94      0.94       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.602, eval_acc=0.964, eval_loss=7.79, eval_precision=0.534, eval_recall=0.7]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.19      0.83      0.30         6
     LOC.NOM       0.38      0.50      0.43         6
     ORG.NAM       0.25      0.34      0.29        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.59      0.73      0.66        90
     PER.NOM       0.67      0.76      0.71       208

   micro avg       0.56      0.70      0.62       389
   macro avg       0.42      0.59      0.48       389
weighted avg       0.58      0.70      0.63       389



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.57it/s, F1=0.956, train_acc=0.997, train_loss=0.605, train_precision=0.949, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.91      0.91      0.91        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       1.00      0.92      0.96        12
     LOC.NOM       0.79      0.85      0.81        13
     ORG.NAM       0.93      0.98      0.96        55
     ORG.NOM       0.75      0.90      0.82        10
     PER.NAM       0.94      0.97      0.95       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.95      0.96      0.95       381
   macro avg       0.79      0.82      0.80       381
weighted avg       0.94      0.96      0.95       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.631, eval_acc=0.965, eval_loss=8.27, eval_precision=0.593, eval_recall=0.681]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.77      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.19      0.83      0.31         6
     LOC.NOM       0.50      0.50      0.50         6
     ORG.NAM       0.32      0.36      0.34        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.69      0.62      0.65        90
     PER.NOM       0.70      0.75      0.73       208

   micro avg       0.61      0.67      0.64       389
   macro avg       0.44      0.58      0.48       389
weighted avg       0.63      0.67      0.65       389



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.26it/s, F1=0.958, train_acc=0.997, train_loss=0.674, train_precision=0.956, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.95      0.95        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.85      0.92      0.88        12
     LOC.NOM       0.85      0.85      0.85        13
     ORG.NAM       0.95      0.96      0.95        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.98      0.94      0.96       105
     PER.NOM       0.98      0.99      0.99       141

   micro avg       0.96      0.96      0.96       381
   macro avg       0.80      0.81      0.80       381
weighted avg       0.95      0.96      0.95       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.618, eval_acc=0.965, eval_loss=7.16, eval_precision=0.546, eval_recall=0.717]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.73      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.83      0.38         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.33      0.55      0.41        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.59      0.78      0.67        90
     PER.NOM       0.68      0.75      0.71       208

   micro avg       0.58      0.72      0.64       389
   macro avg       0.42      0.58      0.47       389
weighted avg       0.60      0.72      0.65       389



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.32it/s, F1=0.958, train_acc=0.998, train_loss=0.407, train_precision=0.955, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.95      0.94        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.77      0.83      0.80        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       0.96      1.00      0.98        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.98      0.99      0.99       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.96      0.97      0.97       381
   macro avg       0.81      0.83      0.82       381
weighted avg       0.96      0.97      0.97       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.627, eval_acc=0.965, eval_loss=7.66, eval_precision=0.557, eval_recall=0.727]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.23      0.83      0.36         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.30      0.38      0.34        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.63      0.73      0.68        90
     PER.NOM       0.68      0.82      0.75       208

   micro avg       0.60      0.74      0.66       389
   macro avg       0.43      0.58      0.48       389
weighted avg       0.61      0.74      0.66       389



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.973, train_acc=0.999, train_loss=0.335, train_precision=0.974, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.95      0.96        43
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       0.98      1.00      0.99       141

   micro avg       0.98      0.99      0.98       381
   macro avg       0.91      0.92      0.91       381
weighted avg       0.98      0.99      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.63, eval_acc=0.967, eval_loss=8.06, eval_precision=0.594, eval_recall=0.681] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.50      0.33      0.40         6
     ORG.NAM       0.33      0.40      0.37        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.67      0.67      0.67        90
     PER.NOM       0.70      0.73      0.71       208

   micro avg       0.62      0.67      0.65       389
   macro avg       0.48      0.57      0.50       389
weighted avg       0.64      0.67      0.65       389



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.995, train_acc=1, train_loss=0.196, train_precision=0.993, train_recall=0.996]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.99      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.622, eval_acc=0.967, eval_loss=8.66, eval_precision=0.589, eval_recall=0.673]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.31      0.36      0.33        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.64      0.64      0.64        90
     PER.NOM       0.72      0.73      0.72       208

   micro avg       0.62      0.66      0.64       389
   macro avg       0.46      0.56      0.49       389
weighted avg       0.63      0.66      0.64       389



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0.993, train_acc=0.999, train_loss=0.214, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.99      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.614, eval_acc=0.962, eval_loss=8.39, eval_precision=0.537, eval_recall=0.723]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.73      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      0.83      0.40         6
     LOC.NOM       0.38      0.50      0.43         6
     ORG.NAM       0.27      0.40      0.32        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.54      0.76      0.63        90
     PER.NOM       0.69      0.80      0.74       208

   micro avg       0.57      0.73      0.64       389
   macro avg       0.40      0.60      0.47       389
weighted avg       0.59      0.73      0.65       389



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=0.985, train_acc=1, train_loss=0.14, train_precision=0.982, train_recall=0.989]     


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.97      0.98      0.98       105
     PER.NOM       0.99      1.00      1.00       141

   micro avg       0.98      0.99      0.99       381
   macro avg       0.97      0.99      0.98       381
weighted avg       0.98      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.618, eval_acc=0.966, eval_loss=8.18, eval_precision=0.57, eval_recall=0.684] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.73      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.32      0.40      0.36        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.62      0.74      0.68        90
     PER.NOM       0.69      0.71      0.70       208

   micro avg       0.59      0.68      0.63       389
   macro avg       0.42      0.57      0.47       389
weighted avg       0.61      0.68      0.64       389



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.994, train_acc=1, train_loss=0.168, train_precision=0.993, train_recall=0.994]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      0.98      0.99       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.99      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.91it/s, F1=0.618, eval_acc=0.966, eval_loss=8.35, eval_precision=0.563, eval_recall=0.695]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.73      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.30      0.38      0.34        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.58      0.78      0.66        90
     PER.NOM       0.70      0.73      0.71       208

   micro avg       0.59      0.69      0.64       389
   macro avg       0.42      0.57      0.47       389
weighted avg       0.60      0.69      0.64       389



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.32it/s, F1=0.991, train_acc=0.999, train_loss=0.175, train_precision=0.991, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       1.00      0.99      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.99      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.63, eval_acc=0.966, eval_loss=8.85, eval_precision=0.561, eval_recall=0.723] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.50      0.50      0.50         6
     ORG.NAM       0.29      0.40      0.34        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.61      0.72      0.66        90
     PER.NOM       0.68      0.80      0.74       208

   micro avg       0.59      0.73      0.65       389
   macro avg       0.43      0.60      0.49       389
weighted avg       0.60      0.73      0.66       389



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=0.978, train_acc=0.999, train_loss=0.248, train_precision=0.976, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.94      0.96      0.95       105
     PER.NOM       0.97      0.99      0.98       141

   micro avg       0.97      0.98      0.98       381
   macro avg       0.97      0.98      0.97       381
weighted avg       0.97      0.98      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.626, eval_acc=0.967, eval_loss=8.93, eval_precision=0.558, eval_recall=0.719]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      0.83      0.40         6
     LOC.NOM       0.27      0.50      0.35         6
     ORG.NAM       0.31      0.51      0.38        47
     ORG.NOM       0.29      1.00      0.45         5
     PER.NAM       0.64      0.71      0.67        90
     PER.NOM       0.69      0.77      0.73       208

   micro avg       0.58      0.72      0.64       389
   macro avg       0.39      0.64      0.46       389
weighted avg       0.61      0.72      0.66       389



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0.947, train_acc=0.999, train_loss=0.265, train_precision=0.943, train_recall=0.951]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.96      0.97      0.97       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.98      0.99      0.98       381
   macro avg       0.97      0.98      0.98       381
weighted avg       0.98      0.99      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.625, eval_acc=0.965, eval_loss=8.97, eval_precision=0.544, eval_recall=0.738]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.73      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.83      0.38         6
     LOC.NOM       0.38      0.50      0.43         6
     ORG.NAM       0.28      0.55      0.37        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.60      0.77      0.67        90
     PER.NOM       0.71      0.79      0.75       208

   micro avg       0.57      0.75      0.65       389
   macro avg       0.39      0.62      0.46       389
weighted avg       0.61      0.75      0.66       389



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.38it/s, F1=0.965, train_acc=1, train_loss=0.0806, train_precision=0.967, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      0.99      1.00       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       1.00      0.99      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      0.99      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.47it/s, F1=0.634, eval_acc=0.965, eval_loss=8.65, eval_precision=0.557, eval_recall=0.741]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      0.83      0.40         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.30      0.51      0.38        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.59      0.79      0.67        90
     PER.NOM       0.73      0.80      0.76       208

   micro avg       0.59      0.76      0.66       389
   macro avg       0.40      0.63      0.47       389
weighted avg       0.62      0.76      0.67       389



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.58it/s, F1=1, train_acc=1, train_loss=0.053, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.633, eval_acc=0.966, eval_loss=8.7, eval_precision=0.571, eval_recall=0.716] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.30      0.47      0.37        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.64      0.72      0.68        90
     PER.NOM       0.73      0.78      0.75       208

   micro avg       0.60      0.72      0.65       389
   macro avg       0.40      0.59      0.46       389
weighted avg       0.63      0.72      0.67       389



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.34it/s, F1=0.968, train_acc=1, train_loss=0.0489, train_precision=0.968, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.644, eval_acc=0.967, eval_loss=8.87, eval_precision=0.588, eval_recall=0.718]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.32      0.49      0.39        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.64      0.72      0.68        90
     PER.NOM       0.73      0.78      0.76       208

   micro avg       0.61      0.72      0.66       389
   macro avg       0.42      0.59      0.48       389
weighted avg       0.63      0.72      0.67       389



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=1, train_acc=1, train_loss=0.0372, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.634, eval_acc=0.967, eval_loss=9.05, eval_precision=0.574, eval_recall=0.715]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.30      0.47      0.37        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.63      0.71      0.67        90
     PER.NOM       0.73      0.78      0.75       208

   micro avg       0.60      0.72      0.65       389
   macro avg       0.40      0.59      0.46       389
weighted avg       0.63      0.72      0.66       389



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0.998, train_acc=1, train_loss=0.0353, train_precision=0.996, train_recall=1]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.653, eval_acc=0.968, eval_loss=9.27, eval_precision=0.6, eval_recall=0.722]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.25      0.33      0.29         6
     ORG.NAM       0.34      0.49      0.40        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.67      0.70      0.68        90
     PER.NOM       0.73      0.79      0.76       208

   micro avg       0.63      0.73      0.67       389
   macro avg       0.42      0.59      0.48       389
weighted avg       0.65      0.73      0.68       389



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.26it/s, F1=1, train_acc=1, train_loss=0.0374, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.06it/s, F1=0.641, eval_acc=0.967, eval_loss=9.4, eval_precision=0.576, eval_recall=0.727] 


eval_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.83      0.38         6
     LOC.NOM       0.43      0.50      0.46         6
     ORG.NAM       0.31      0.49      0.38        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.65      0.70      0.67        90
     PER.NOM       0.73      0.80      0.76       208

   micro avg       0.60      0.73      0.66       389
   macro avg       0.40      0.61      0.47       389
weighted avg       0.63      0.73      0.67       389



calculate data/few_shot/weibo/train_250.json etag: 100%|██████████| 170k/170k [00:00<00:00, 189MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 198MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 241MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 599kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_250.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/weibo/test.json",
    "tag_file": "data/few_shot/weibo/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "weibo_pretrain_lebert_crf_250_x2"
}
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree



count line size data/few_shot/weibo/labels.txt: 29L [00:00, 235270.44L/s]
build line mapper: 29L [00:00, 211907.34L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8359.78it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 260400.25it/s]
load dataset from data/few_shot/weibo/train_250.json: 36it [00:00, 359.02it/s]

load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_250.json: 250it [00:00, 346.61it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 351.77it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fr

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.19it/s, F1=0, train_acc=0.314, train_loss=132, train_precision=0, train_recall=0]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.26it/s, F1=0, eval_acc=0.933, eval_loss=32.1, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.28it/s, F1=0, train_acc=0.927, train_loss=32.4, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.19it/s, F1=0, eval_acc=0.933, eval_loss=23.5, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.20it/s, F1=0, train_acc=0.924, train_loss=27.3, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0, eval_acc=0.933, eval_loss=20.6, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.19it/s, F1=0, train_acc=0.926, train_loss=23.4, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0, eval_acc=0.931, eval_loss=14.9, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.00919, train_acc=0.928, train_loss=15.8, train_precision=0.00905, train_recall=0.00972]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.01      0.02      0.01        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.02      0.02      0.02       105
     PER.NOM       0.01      0.01      0.01       141

   micro avg       0.01      0.01      0.01       381
   macro avg       0.00      0.01      0.00       381
weighted avg       0.01      0.01      0.01       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.0419, eval_acc=0.943, eval_loss=9.85, eval_precision=0.0407, eval_recall=0.0434]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.01      0.01      0.01        90
     PER.NOM       0.07      0.09      0.08       208

   micro avg       0.05      0.05      0.05       389
   macro avg       0.01      0.01      0.01       389
weighted avg       0.04      0.05      0.04       389



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.22it/s, F1=0.285, train_acc=0.954, train_loss=10.1, train_precision=0.279, train_recall=0.307]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.05      0.07      0.06        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.17      0.30      0.22       105
     PER.NOM       0.36      0.53      0.43       141

   micro avg       0.21      0.29      0.24       381
   macro avg       0.07      0.11      0.09       381
weighted avg       0.19      0.29      0.23       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.33, eval_acc=0.954, eval_loss=7.57, eval_precision=0.268, eval_recall=0.436] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.02      0.04      0.03        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.19      0.39      0.25        90
     PER.NOM       0.50      0.64      0.57       208

   micro avg       0.29      0.44      0.35       389
   macro avg       0.09      0.13      0.11       389
weighted avg       0.32      0.44      0.36       389



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0.418, train_acc=0.969, train_loss=6.24, train_precision=0.376, train_recall=0.484]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.10      0.19      0.13        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.10      0.20      0.14        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.43      0.60      0.50       105
     PER.NOM       0.58      0.73      0.65       141

   micro avg       0.36      0.49      0.42       381
   macro avg       0.15      0.21      0.18       381
weighted avg       0.36      0.49      0.41       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.417, eval_acc=0.953, eval_loss=7.52, eval_precision=0.311, eval_recall=0.661]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.18      0.42      0.26        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.03      0.11      0.04        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.30      0.72      0.42        90
     PER.NOM       0.60      0.79      0.68       208

   micro avg       0.33      0.63      0.43       389
   macro avg       0.14      0.26      0.18       389
weighted avg       0.41      0.63      0.49       389



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.20it/s, F1=0.643, train_acc=0.978, train_loss=4.48, train_precision=0.606, train_recall=0.701]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.40      0.63      0.49        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.25      0.15      0.19        13
     ORG.NAM       0.28      0.38      0.33        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.55      0.77      0.64       105
     PER.NOM       0.73      0.87      0.79       141

   micro avg       0.53      0.66      0.59       381
   macro avg       0.28      0.35      0.30       381
weighted avg       0.51      0.66      0.58       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.492, eval_acc=0.962, eval_loss=7.39, eval_precision=0.416, eval_recall=0.624]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.39      0.65      0.49        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.06      0.15      0.08        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.52      0.59      0.55        90
     PER.NOM       0.64      0.72      0.68       208

   micro avg       0.43      0.58      0.50       389
   macro avg       0.20      0.26      0.22       389
weighted avg       0.49      0.58      0.53       389



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.31it/s, F1=0.72, train_acc=0.987, train_loss=2.98, train_precision=0.678, train_recall=0.781] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.60      0.77      0.67        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.33      0.31      0.32        13
     ORG.NAM       0.44      0.75      0.55        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.69      0.82      0.75       105
     PER.NOM       0.90      0.93      0.91       141

   micro avg       0.65      0.77      0.71       381
   macro avg       0.37      0.45      0.40       381
weighted avg       0.66      0.77      0.71       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.592, eval_acc=0.962, eval_loss=7.34, eval_precision=0.499, eval_recall=0.736]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.35      0.62      0.44        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.38      0.50      0.43         6
     ORG.NAM       0.24      0.55      0.34        47
     ORG.NOM       1.00      0.80      0.89         5
     PER.NAM       0.44      0.68      0.53        90
     PER.NOM       0.62      0.79      0.69       208

   micro avg       0.47      0.70      0.56       389
   macro avg       0.38      0.49      0.42       389
weighted avg       0.50      0.70      0.58       389



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=0.811, train_acc=0.991, train_loss=2.11, train_precision=0.794, train_recall=0.836]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.72      0.84      0.77        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.36      0.42      0.38        12
     LOC.NOM       0.62      0.62      0.62        13
     ORG.NAM       0.75      0.82      0.78        55
     ORG.NOM       0.89      0.80      0.84        10
     PER.NAM       0.83      0.90      0.86       105
     PER.NOM       0.87      0.90      0.89       141

   micro avg       0.80      0.85      0.82       381
   macro avg       0.63      0.66      0.64       381
weighted avg       0.79      0.85      0.82       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.573, eval_acc=0.963, eval_loss=7.23, eval_precision=0.485, eval_recall=0.714]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.54      0.73      0.62        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.11      0.33      0.17         6
     LOC.NOM       0.50      0.50      0.50         6
     ORG.NAM       0.23      0.47      0.31        47
     ORG.NOM       0.80      0.80      0.80         5
     PER.NAM       0.48      0.70      0.57        90
     PER.NOM       0.68      0.80      0.74       208

   micro avg       0.52      0.72      0.61       389
   macro avg       0.42      0.54      0.46       389
weighted avg       0.56      0.72      0.63       389



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=0.887, train_acc=0.994, train_loss=1.6, train_precision=0.87, train_recall=0.911]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.80      0.91      0.85        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.77      0.83      0.80        12
     LOC.NOM       0.58      0.54      0.56        13
     ORG.NAM       0.87      0.96      0.91        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.77      0.89      0.82       105
     PER.NOM       0.89      0.94      0.91       141

   micro avg       0.82      0.90      0.86       381
   macro avg       0.69      0.75      0.71       381
weighted avg       0.82      0.90      0.86       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.611, eval_acc=0.965, eval_loss=7.36, eval_precision=0.518, eval_recall=0.752]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.49      0.81      0.61        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.50      0.25         6
     LOC.NOM       0.57      0.67      0.62         6
     ORG.NAM       0.29      0.43      0.34        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.48      0.76      0.58        90
     PER.NOM       0.71      0.82      0.76       208

   micro avg       0.55      0.75      0.63       389
   macro avg       0.40      0.60      0.47       389
weighted avg       0.57      0.75      0.64       389



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.48it/s, F1=0.894, train_acc=0.994, train_loss=1.51, train_precision=0.875, train_recall=0.918]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.86      0.88      0.87        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.77      0.83      0.80        12
     LOC.NOM       0.62      0.77      0.69        13
     ORG.NAM       0.91      0.95      0.93        55
     ORG.NOM       0.90      0.90      0.90        10
     PER.NAM       0.78      0.90      0.84       105
     PER.NOM       0.97      0.98      0.97       141

   micro avg       0.87      0.92      0.90       381
   macro avg       0.73      0.78      0.75       381
weighted avg       0.87      0.92      0.90       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.591, eval_acc=0.963, eval_loss=7.5, eval_precision=0.523, eval_recall=0.689] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.52      0.65      0.58        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.67      0.33         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.30      0.40      0.35        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.47      0.71      0.57        90
     PER.NOM       0.72      0.75      0.73       208

   micro avg       0.56      0.68      0.61       389
   macro avg       0.40      0.54      0.45       389
weighted avg       0.58      0.68      0.62       389



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=0.882, train_acc=0.996, train_loss=1.03, train_precision=0.879, train_recall=0.888] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.91      0.95      0.93        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.77      0.83      0.80        12
     LOC.NOM       0.60      0.69      0.64        13
     ORG.NAM       0.92      0.98      0.95        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.90      0.93      0.92       105
     PER.NOM       0.95      0.94      0.95       141

   micro avg       0.90      0.93      0.92       381
   macro avg       0.73      0.78      0.76       381
weighted avg       0.90      0.93      0.91       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.602, eval_acc=0.963, eval_loss=7.92, eval_precision=0.518, eval_recall=0.725]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.20      0.50      0.29         6
     LOC.NOM       0.50      0.67      0.57         6
     ORG.NAM       0.29      0.40      0.34        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.48      0.81      0.60        90
     PER.NOM       0.67      0.77      0.72       208

   micro avg       0.54      0.73      0.62       389
   macro avg       0.41      0.59      0.48       389
weighted avg       0.56      0.73      0.63       389



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.32it/s, F1=0.939, train_acc=0.996, train_loss=1.2, train_precision=0.926, train_recall=0.957]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.93      0.91        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.92      0.92      0.92        12
     LOC.NOM       0.77      0.77      0.77        13
     ORG.NAM       0.91      0.96      0.94        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.82      0.93      0.87       105
     PER.NOM       0.94      0.97      0.95       141

   micro avg       0.88      0.94      0.91       381
   macro avg       0.76      0.80      0.78       381
weighted avg       0.88      0.94      0.91       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.608, eval_acc=0.965, eval_loss=10.4, eval_precision=0.641, eval_recall=0.589]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.50      0.35         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.41      0.34      0.37        47
     ORG.NOM       0.80      0.80      0.80         5
     PER.NAM       0.74      0.59      0.65        90
     PER.NOM       0.73      0.57      0.64       208

   micro avg       0.66      0.56      0.61       389
   macro avg       0.44      0.46      0.44       389
weighted avg       0.66      0.56      0.60       389



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.17it/s, F1=0.889, train_acc=0.994, train_loss=1.54, train_precision=0.885, train_recall=0.905]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.95      0.95        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.65      0.92      0.76        12
     LOC.NOM       0.67      0.77      0.71        13
     ORG.NAM       0.95      1.00      0.97        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.77      0.83      0.80       105
     PER.NOM       0.96      0.96      0.96       141

   micro avg       0.87      0.92      0.89       381
   macro avg       0.72      0.79      0.75       381
weighted avg       0.88      0.92      0.89       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.602, eval_acc=0.964, eval_loss=7.61, eval_precision=0.524, eval_recall=0.719]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.77      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.20      0.50      0.29         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.26      0.47      0.34        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.55      0.73      0.63        90
     PER.NOM       0.72      0.79      0.75       208

   micro avg       0.56      0.72      0.63       389
   macro avg       0.37      0.55      0.44       389
weighted avg       0.59      0.72      0.65       389



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.20it/s, F1=0.961, train_acc=0.998, train_loss=0.746, train_precision=0.961, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.92      0.92      0.92        12
     LOC.NOM       0.60      0.69      0.64        13
     ORG.NAM       0.96      0.98      0.97        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.96      0.97      0.97       105
     PER.NOM       0.98      0.98      0.98       141

   micro avg       0.95      0.96      0.96       381
   macro avg       0.80      0.82      0.81       381
weighted avg       0.96      0.96      0.96       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.593, eval_acc=0.959, eval_loss=9.66, eval_precision=0.493, eval_recall=0.755]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.67      0.27         6
     LOC.NOM       0.29      0.67      0.40         6
     ORG.NAM       0.30      0.43      0.35        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.53      0.69      0.60        90
     PER.NOM       0.60      0.85      0.70       208

   micro avg       0.51      0.75      0.61       389
   macro avg       0.34      0.62      0.42       389
weighted avg       0.53      0.75      0.62       389



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=0.976, train_acc=0.999, train_loss=0.45, train_precision=0.966, train_recall=0.988] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.92      0.92      0.92        12
     LOC.NOM       0.75      0.92      0.83        13
     ORG.NAM       0.96      1.00      0.98        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       0.97      1.00      0.98       141

   micro avg       0.96      0.98      0.97       381
   macro avg       0.82      0.85      0.83       381
weighted avg       0.96      0.98      0.97       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.651, eval_acc=0.965, eval_loss=9.01, eval_precision=0.624, eval_recall=0.685]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.52      0.88      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.50      0.35         6
     LOC.NOM       0.67      0.33      0.44         6
     ORG.NAM       0.39      0.34      0.36        47
     ORG.NOM       0.80      0.80      0.80         5
     PER.NAM       0.58      0.66      0.62        90
     PER.NOM       0.78      0.76      0.77       208

   micro avg       0.65      0.68      0.66       389
   macro avg       0.50      0.53      0.50       389
weighted avg       0.66      0.68      0.66       389



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=0.97, train_acc=0.999, train_loss=0.338, train_precision=0.968, train_recall=0.972] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      1.00      0.98        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.85      0.92      0.88        12
     LOC.NOM       0.69      0.85      0.76        13
     ORG.NAM       1.00      0.98      0.99        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.97      0.98      0.97       381
   macro avg       0.81      0.84      0.82       381
weighted avg       0.97      0.98      0.97       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.21it/s, F1=0.626, eval_acc=0.965, eval_loss=9.06, eval_precision=0.562, eval_recall=0.714]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.53      0.65      0.59        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.67      0.33      0.44         6
     ORG.NAM       0.33      0.43      0.37        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.52      0.74      0.61        90
     PER.NOM       0.71      0.79      0.75       208

   micro avg       0.59      0.72      0.65       389
   macro avg       0.46      0.55      0.49       389
weighted avg       0.60      0.72      0.65       389



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=0.963, train_acc=0.997, train_loss=0.753, train_precision=0.953, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.79      0.92      0.85        12
     LOC.NOM       0.80      0.92      0.86        13
     ORG.NAM       0.96      0.98      0.97        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.96      0.99      0.98       105
     PER.NOM       0.97      0.98      0.98       141

   micro avg       0.95      0.97      0.96       381
   macro avg       0.81      0.85      0.83       381
weighted avg       0.95      0.97      0.96       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.47it/s, F1=0.645, eval_acc=0.967, eval_loss=8.52, eval_precision=0.619, eval_recall=0.68] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.67      0.44         6
     LOC.NOM       0.67      0.33      0.44         6
     ORG.NAM       0.30      0.40      0.34        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.71      0.67      0.69        90
     PER.NOM       0.75      0.74      0.74       208

   micro avg       0.64      0.68      0.66       389
   macro avg       0.51      0.55      0.51       389
weighted avg       0.66      0.68      0.67       389



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.23it/s, F1=0.978, train_acc=0.999, train_loss=0.413, train_precision=0.974, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.92      0.92      0.92        12
     LOC.NOM       0.71      0.92      0.80        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.98      0.98      0.98       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.97      0.98      0.98       381
   macro avg       0.82      0.85      0.84       381
weighted avg       0.97      0.98      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.65, eval_acc=0.967, eval_loss=8.32, eval_precision=0.59, eval_recall=0.728]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.33      0.40      0.37        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.62      0.74      0.68        90
     PER.NOM       0.68      0.82      0.74       208

   micro avg       0.61      0.74      0.67       389
   macro avg       0.45      0.57      0.50       389
weighted avg       0.61      0.74      0.67       389



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.22it/s, F1=0.986, train_acc=0.999, train_loss=0.332, train_precision=0.989, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       0.92      1.00      0.96        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.98      0.96      0.97       105
     PER.NOM       1.00      0.99      1.00       141

   micro avg       0.99      0.98      0.98       381
   macro avg       0.92      0.93      0.93       381
weighted avg       0.99      0.98      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.6, eval_acc=0.964, eval_loss=8.85, eval_precision=0.507, eval_recall=0.741]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.77      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.28      0.45      0.34        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.46      0.82      0.59        90
     PER.NOM       0.65      0.80      0.71       208

   micro avg       0.52      0.75      0.62       389
   macro avg       0.38      0.60      0.46       389
weighted avg       0.54      0.75      0.62       389



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=0.952, train_acc=0.999, train_loss=0.22, train_precision=0.952, train_recall=0.953] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       0.92      0.92      0.92        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.94      0.97      0.96       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.97      0.98      0.98       381
   macro avg       0.92      0.92      0.92       381
weighted avg       0.97      0.98      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.673, eval_acc=0.967, eval_loss=8.53, eval_precision=0.608, eval_recall=0.758]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.77      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.50      0.35         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.37      0.49      0.42        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.60      0.70      0.65        90
     PER.NOM       0.70      0.85      0.76       208

   micro avg       0.61      0.75      0.67       389
   macro avg       0.41      0.55      0.47       389
weighted avg       0.61      0.75      0.67       389



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.18it/s, F1=0.962, train_acc=1, train_loss=0.179, train_precision=0.963, train_recall=0.962]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      0.92      0.96        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      0.98      0.99       105
     PER.NOM       0.99      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       1.00      0.99      0.99       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.02it/s, F1=0.605, eval_acc=0.965, eval_loss=8.86, eval_precision=0.525, eval_recall=0.723]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.73      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.15      0.83      0.25         6
     LOC.NOM       0.50      0.33      0.40         6
     ORG.NAM       0.26      0.47      0.34        47
     ORG.NOM       0.43      0.60      0.50         5
     PER.NAM       0.54      0.79      0.64        90
     PER.NOM       0.75      0.78      0.76       208

   micro avg       0.56      0.73      0.63       389
   macro avg       0.40      0.57      0.44       389
weighted avg       0.61      0.73      0.66       389



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:13<00:00,  2.45it/s, F1=0.959, train_acc=0.999, train_loss=0.233, train_precision=0.957, train_recall=0.961]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.98      0.99        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.92      0.92      0.92        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       0.96      0.98      0.97        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.98      1.00      0.99       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.98      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.645, eval_acc=0.966, eval_loss=8.72, eval_precision=0.604, eval_recall=0.697]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.77      0.65        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.23      0.50      0.32         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.35      0.38      0.36        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.64      0.68      0.66        90
     PER.NOM       0.73      0.78      0.76       208

   micro avg       0.63      0.70      0.66       389
   macro avg       0.44      0.53      0.47       389
weighted avg       0.63      0.70      0.66       389



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0.999, train_acc=1, train_loss=0.111, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.93it/s, F1=0.646, eval_acc=0.966, eval_loss=8.73, eval_precision=0.584, eval_recall=0.729]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.73      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.21      0.83      0.33         6
     LOC.NOM       0.43      0.50      0.46         6
     ORG.NAM       0.33      0.38      0.35        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.61      0.77      0.68        90
     PER.NOM       0.74      0.81      0.78       208

   micro avg       0.62      0.74      0.67       389
   macro avg       0.43      0.60      0.48       389
weighted avg       0.63      0.74      0.68       389



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.21it/s, F1=0.998, train_acc=1, train_loss=0.0957, train_precision=0.996, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.92      1.00      0.96        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.99      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      1.00      0.99       381
   macro avg       0.99      1.00      0.99       381
weighted avg       0.99      1.00      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.652, eval_acc=0.966, eval_loss=9.52, eval_precision=0.614, eval_recall=0.701]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.81      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.23      0.50      0.32         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.40      0.38      0.39        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.66      0.68      0.67        90
     PER.NOM       0.73      0.78      0.76       208

   micro avg       0.65      0.70      0.67       389
   macro avg       0.46      0.54      0.49       389
weighted avg       0.65      0.70      0.67       389



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.19it/s, F1=0.998, train_acc=1, train_loss=0.0751, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       0.98      1.00      0.99        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      1.00      1.00       381
   macro avg       0.99      1.00      1.00       381
weighted avg       0.99      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.649, eval_acc=0.966, eval_loss=9.64, eval_precision=0.602, eval_recall=0.713]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.77      0.62        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.21      0.50      0.30         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.35      0.38      0.37        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.67      0.69      0.68        90
     PER.NOM       0.74      0.81      0.78       208

   micro avg       0.64      0.71      0.67       389
   macro avg       0.43      0.54      0.47       389
weighted avg       0.65      0.71      0.68       389



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.14it/s, F1=0.998, train_acc=1, train_loss=0.0697, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.98      0.99      0.99       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       0.99      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.92it/s, F1=0.654, eval_acc=0.965, eval_loss=9.75, eval_precision=0.605, eval_recall=0.717]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.81      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.38      0.38      0.38        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.63      0.69      0.66        90
     PER.NOM       0.73      0.81      0.77       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.45      0.56      0.49       389
weighted avg       0.64      0.72      0.68       389



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.22it/s, F1=0.997, train_acc=1, train_loss=0.0465, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       0.98      0.98      0.98        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      1.00      1.00       381
   macro avg       0.99      1.00      1.00       381
weighted avg       0.99      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.635, eval_acc=0.967, eval_loss=9.56, eval_precision=0.581, eval_recall=0.708]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.69      0.61        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.20      0.50      0.29         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.33      0.38      0.35        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.63      0.69      0.66        90
     PER.NOM       0.73      0.81      0.77       208

   micro avg       0.62      0.71      0.66       389
   macro avg       0.42      0.53      0.46       389
weighted avg       0.63      0.71      0.66       389



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.20it/s, F1=0.936, train_acc=1, train_loss=0.119, train_precision=0.938, train_recall=0.934]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       1.00      0.99      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       1.00      1.00      1.00       381
   macro avg       1.00      1.00      1.00       381
weighted avg       1.00      1.00      1.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.12it/s, F1=0.642, eval_acc=0.967, eval_loss=9.06, eval_precision=0.581, eval_recall=0.722]


eval_reports:


calculate data/few_shot/weibo/train_250.json etag: 100%|██████████| 170k/170k [00:00<00:00, 256MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 189MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 194MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 495kB/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.73      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.67      0.33         6
     LOC.NOM       0.75      0.50      0.60         6
     ORG.NAM       0.30      0.40      0.35        47
     ORG.NOM       0.43      0.60      0.50         5
     PER.NAM       0.59      0.73      0.66        90
     PER.NOM       0.73      0.81      0.77       208

   micro avg       0.61      0.73      0.66       389
   macro avg       0.45      0.56      0.48       389
weighted avg       0.63      0.73      0.67       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_250.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/w


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 243269.63L/s]
build line mapper: 29L [00:00, 217983.54L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8445.10it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 259824.14it/s]
load dataset from data/few_shot/weibo/train_250.json: 34it [00:00, 336.41it/s]

load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/dfcab4601ac8d4aaec9b6ecfb221d3ec_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_250.json: 250it [00:00, 414.23it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 506.00it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fr

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.19it/s, F1=0.000296, train_acc=0.0779, train_loss=237, train_precision=0.000153, train_recall=0.00567]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.01      0.00       141

   micro avg       0.00      0.01      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.01      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0, eval_acc=0.689, eval_loss=86.9, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.18it/s, F1=0, train_acc=0.926, train_loss=39.2, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0, eval_acc=0.933, eval_loss=25.5, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0, train_acc=0.926, train_loss=28.9, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0, eval_acc=0.933, eval_loss=23.9, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.14it/s, F1=0, train_acc=0.93, train_loss=27.8, train_precision=0, train_recall=0] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0, eval_acc=0.933, eval_loss=22.9, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.29it/s, F1=0, train_acc=0.931, train_loss=25.6, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.00      0.00      0.00       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.00      0.00      0.00       381
   macro avg       0.00      0.00      0.00       381
weighted avg       0.00      0.00      0.00       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0, eval_acc=0.933, eval_loss=17.4, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.28it/s, F1=0.0135, train_acc=0.928, train_loss=18.5, train_precision=0.0148, train_recall=0.0148]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.00      0.00      0.00        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.04      0.04      0.04       105
     PER.NOM       0.00      0.00      0.00       141

   micro avg       0.01      0.01      0.01       381
   macro avg       0.01      0.00      0.00       381
weighted avg       0.01      0.01      0.01       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.0294, eval_acc=0.947, eval_loss=11.9, eval_precision=0.0255, eval_recall=0.035] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.08      0.13      0.10        90
     PER.NOM       0.02      0.02      0.02       208

   micro avg       0.03      0.04      0.04       389
   macro avg       0.01      0.02      0.01       389
weighted avg       0.03      0.04      0.03       389



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.22it/s, F1=0.124, train_acc=0.946, train_loss=12.1, train_precision=0.106, train_recall=0.16]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.01      0.02      0.01        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.21      0.35      0.26       105
     PER.NOM       0.13      0.21      0.16       141

   micro avg       0.11      0.18      0.14       381
   macro avg       0.04      0.07      0.05       381
weighted avg       0.11      0.18      0.13       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.367, eval_acc=0.956, eval_loss=8.98, eval_precision=0.284, eval_recall=0.527]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.03      0.09      0.05        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.35      0.63      0.45        90
     PER.NOM       0.44      0.70      0.54       208

   micro avg       0.30      0.53      0.39       389
   macro avg       0.10      0.18      0.13       389
weighted avg       0.32      0.53      0.40       389



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.49it/s, F1=0.479, train_acc=0.968, train_loss=7.51, train_precision=0.428, train_recall=0.561]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.01      0.02      0.02        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.05      0.15      0.08        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.53      0.68      0.59       105
     PER.NOM       0.64      0.84      0.73       141

   micro avg       0.36      0.52      0.42       381
   macro avg       0.16      0.21      0.18       381
weighted avg       0.39      0.52      0.45       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.46it/s, F1=0.388, eval_acc=0.956, eval_loss=7.92, eval_precision=0.298, eval_recall=0.57] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.01      0.02      0.01        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.38      0.72      0.50        90
     PER.NOM       0.60      0.74      0.66       208

   micro avg       0.32      0.57      0.41       389
   macro avg       0.12      0.19      0.15       389
weighted avg       0.41      0.57      0.47       389



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=0.471, train_acc=0.974, train_loss=5.62, train_precision=0.419, train_recall=0.546]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.01      0.02      0.01        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.08      0.22      0.12        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.60      0.74      0.67       105
     PER.NOM       0.75      0.84      0.80       141

   micro avg       0.40      0.55      0.46       381
   macro avg       0.18      0.23      0.20       381
weighted avg       0.46      0.55      0.50       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.432, eval_acc=0.957, eval_loss=7.77, eval_precision=0.335, eval_recall=0.62] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.08      0.27      0.13        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.02      0.06      0.03        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.38      0.67      0.49        90
     PER.NOM       0.60      0.76      0.67       208

   micro avg       0.34      0.59      0.43       389
   macro avg       0.14      0.22      0.16       389
weighted avg       0.42      0.59      0.48       389



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.669, train_acc=0.981, train_loss=4.12, train_precision=0.639, train_recall=0.72] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.26      0.53      0.35        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.21      0.40      0.28        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.82      0.90      0.86       105
     PER.NOM       0.81      0.90      0.86       141

   micro avg       0.57      0.70      0.63       381
   macro avg       0.26      0.34      0.29       381
weighted avg       0.59      0.70      0.63       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.537, eval_acc=0.962, eval_loss=8.04, eval_precision=0.434, eval_recall=0.71] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.24      0.62      0.34        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.15      0.30      0.20        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.47      0.73      0.58        90
     PER.NOM       0.63      0.84      0.72       208

   micro avg       0.45      0.69      0.55       389
   macro avg       0.19      0.31      0.23       389
weighted avg       0.48      0.69      0.57       389



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.18it/s, F1=0.724, train_acc=0.988, train_loss=2.8, train_precision=0.681, train_recall=0.784] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.54      0.79      0.64        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.69      0.89      0.78        55
     ORG.NOM       0.00      0.00      0.00        10
     PER.NAM       0.79      0.89      0.83       105
     PER.NOM       0.84      0.90      0.87       141

   micro avg       0.68      0.80      0.74       381
   macro avg       0.36      0.43      0.39       381
weighted avg       0.69      0.80      0.74       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.58, eval_acc=0.962, eval_loss=8.34, eval_precision=0.499, eval_recall=0.695] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.40      0.69      0.51        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.23      0.43      0.30        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.50      0.63      0.56        90
     PER.NOM       0.66      0.79      0.72       208

   micro avg       0.50      0.67      0.57       389
   macro avg       0.22      0.32      0.26       389
weighted avg       0.52      0.67      0.59       389



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.24it/s, F1=0.795, train_acc=0.99, train_loss=2.06, train_precision=0.776, train_recall=0.826] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.82      0.93      0.87        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.33      0.42      0.37        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.82      0.96      0.88        55
     ORG.NOM       0.17      0.20      0.18        10
     PER.NAM       0.86      0.92      0.89       105
     PER.NOM       0.84      0.88      0.86       141

   micro avg       0.77      0.84      0.80       381
   macro avg       0.48      0.54      0.51       381
weighted avg       0.77      0.84      0.81       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.582, eval_acc=0.963, eval_loss=8.53, eval_precision=0.513, eval_recall=0.676]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.81      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.12      0.50      0.19         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.32      0.32      0.32        47
     ORG.NOM       0.15      0.40      0.22         5
     PER.NAM       0.56      0.67      0.61        90
     PER.NOM       0.68      0.76      0.72       208

   micro avg       0.53      0.67      0.59       389
   macro avg       0.29      0.43      0.34       389
weighted avg       0.57      0.67      0.61       389



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.12it/s, F1=0.873, train_acc=0.994, train_loss=1.92, train_precision=0.85, train_recall=0.903] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.83      0.91      0.87        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.55      0.92      0.69        12
     LOC.NOM       0.11      0.15      0.13        13
     ORG.NAM       0.82      0.93      0.87        55
     ORG.NOM       0.27      0.30      0.29        10
     PER.NAM       0.90      0.93      0.92       105
     PER.NOM       0.94      0.96      0.95       141

   micro avg       0.83      0.89      0.86       381
   macro avg       0.55      0.64      0.59       381
weighted avg       0.84      0.89      0.86       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.593, eval_acc=0.966, eval_loss=8.46, eval_precision=0.537, eval_recall=0.668]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.54      0.73      0.62        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.50      0.33         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.29      0.40      0.34        47
     ORG.NOM       0.43      0.60      0.50         5
     PER.NAM       0.55      0.64      0.59        90
     PER.NOM       0.69      0.74      0.71       208

   micro avg       0.56      0.66      0.61       389
   macro avg       0.34      0.45      0.39       389
weighted avg       0.58      0.66      0.61       389



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.19it/s, F1=0.88, train_acc=0.995, train_loss=1.28, train_precision=0.866, train_recall=0.9]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.93      0.93        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.71      0.83      0.77        12
     LOC.NOM       0.00      0.00      0.00        13
     ORG.NAM       0.88      0.96      0.92        55
     ORG.NOM       0.41      0.70      0.52        10
     PER.NAM       0.93      0.95      0.94       105
     PER.NOM       0.94      0.96      0.95       141

   micro avg       0.86      0.91      0.88       381
   macro avg       0.60      0.67      0.63       381
weighted avg       0.87      0.91      0.89       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.21it/s, F1=0.631, eval_acc=0.965, eval_loss=8.71, eval_precision=0.552, eval_recall=0.738]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.16      0.67      0.26         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.32      0.47      0.38        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.47      0.74      0.58        90
     PER.NOM       0.72      0.76      0.74       208

   micro avg       0.54      0.71      0.61       389
   macro avg       0.33      0.51      0.39       389
weighted avg       0.58      0.71      0.63       389



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.19it/s, F1=0.925, train_acc=0.996, train_loss=1.04, train_precision=0.907, train_recall=0.947] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.83      0.93      0.88        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.92      0.92      0.92        12
     LOC.NOM       0.37      0.54      0.44        13
     ORG.NAM       0.95      0.96      0.95        55
     ORG.NOM       0.47      0.70      0.56        10
     PER.NAM       0.95      0.96      0.96       105
     PER.NOM       0.97      0.99      0.98       141

   micro avg       0.90      0.94      0.92       381
   macro avg       0.68      0.75      0.71       381
weighted avg       0.90      0.94      0.92       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.625, eval_acc=0.965, eval_loss=8.79, eval_precision=0.58, eval_recall=0.681] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.73      0.64        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.23      0.83      0.36         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.33      0.34      0.34        47
     ORG.NOM       0.80      0.80      0.80         5
     PER.NAM       0.51      0.70      0.59        90
     PER.NOM       0.75      0.75      0.75       208

   micro avg       0.59      0.68      0.63       389
   macro avg       0.40      0.52      0.43       389
weighted avg       0.61      0.68      0.64       389



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.34it/s, F1=0.886, train_acc=0.996, train_loss=0.796, train_precision=0.875, train_recall=0.899]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.91      0.90        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.69      0.92      0.79        12
     LOC.NOM       0.33      0.46      0.39        13
     ORG.NAM       0.96      1.00      0.98        55
     ORG.NOM       0.58      0.70      0.64        10
     PER.NAM       0.94      0.95      0.95       105
     PER.NOM       0.95      0.96      0.96       141

   micro avg       0.89      0.93      0.91       381
   macro avg       0.67      0.74      0.70       381
weighted avg       0.90      0.93      0.91       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.585, eval_acc=0.961, eval_loss=9.85, eval_precision=0.503, eval_recall=0.706]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.50      0.81      0.62        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.21      0.50      0.30         6
     LOC.NOM       0.09      0.33      0.14         6
     ORG.NAM       0.28      0.36      0.31        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.52      0.69      0.59        90
     PER.NOM       0.67      0.80      0.73       208

   micro avg       0.53      0.71      0.61       389
   macro avg       0.32      0.54      0.39       389
weighted avg       0.55      0.71      0.62       389



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.26it/s, F1=0.909, train_acc=0.997, train_loss=0.762, train_precision=0.898, train_recall=0.922]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.93      0.91        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.83      0.83      0.83        12
     LOC.NOM       0.53      0.77      0.62        13
     ORG.NAM       0.95      0.98      0.96        55
     ORG.NOM       0.54      0.70      0.61        10
     PER.NAM       0.94      0.96      0.95       105
     PER.NOM       0.97      0.99      0.98       141

   micro avg       0.91      0.95      0.93       381
   macro avg       0.71      0.77      0.73       381
weighted avg       0.92      0.95      0.93       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.593, eval_acc=0.962, eval_loss=9.61, eval_precision=0.505, eval_recall=0.722]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.65      0.60        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.16      0.83      0.27         6
     LOC.NOM       0.17      0.50      0.25         6
     ORG.NAM       0.25      0.45      0.32        47
     ORG.NOM       0.30      0.60      0.40         5
     PER.NAM       0.54      0.73      0.62        90
     PER.NOM       0.69      0.80      0.74       208

   micro avg       0.52      0.72      0.61       389
   macro avg       0.33      0.57      0.40       389
weighted avg       0.57      0.72      0.63       389



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.22it/s, F1=0.971, train_acc=0.998, train_loss=0.585, train_precision=0.97, train_recall=0.972] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.95      0.94        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       0.80      0.92      0.86        13
     ORG.NAM       0.96      1.00      0.98        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       1.00      0.99      1.00       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.97      0.98      0.98       381
   macro avg       0.81      0.84      0.83       381
weighted avg       0.97      0.98      0.97       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.633, eval_acc=0.964, eval_loss=9.35, eval_precision=0.569, eval_recall=0.718]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.73      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.67      0.27         6
     LOC.NOM       0.13      0.33      0.19         6
     ORG.NAM       0.36      0.43      0.39        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.61      0.69      0.65        90
     PER.NOM       0.72      0.82      0.76       208

   micro avg       0.60      0.72      0.65       389
   macro avg       0.39      0.56      0.44       389
weighted avg       0.62      0.72      0.67       389



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.18it/s, F1=0.854, train_acc=0.991, train_loss=2.86, train_precision=0.85, train_recall=0.866] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.83      0.83      0.83        12
     LOC.NOM       0.71      0.77      0.74        13
     ORG.NAM       0.84      0.93      0.88        55
     ORG.NOM       0.73      0.80      0.76        10
     PER.NAM       0.75      0.81      0.78       105
     PER.NOM       0.96      0.96      0.96       141

   micro avg       0.86      0.90      0.88       381
   macro avg       0.72      0.76      0.74       381
weighted avg       0.86      0.90      0.88       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.627, eval_acc=0.966, eval_loss=9.52, eval_precision=0.605, eval_recall=0.655]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.24      0.67      0.35         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.35      0.40      0.37        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.65      0.71      0.68        90
     PER.NOM       0.72      0.66      0.69       208

   micro avg       0.62      0.64      0.63       389
   macro avg       0.43      0.53      0.46       389
weighted avg       0.64      0.64      0.64       389



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.48it/s, F1=0.944, train_acc=0.997, train_loss=0.945, train_precision=0.947, train_recall=0.948]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.98      0.95        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.83      0.83      0.83        12
     LOC.NOM       0.69      0.85      0.76        13
     ORG.NAM       0.90      0.98      0.94        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.95      0.97      0.96       105
     PER.NOM       0.99      0.97      0.98       141

   micro avg       0.93      0.96      0.95       381
   macro avg       0.76      0.81      0.79       381
weighted avg       0.93      0.96      0.95       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.63, eval_acc=0.963, eval_loss=9.74, eval_precision=0.555, eval_recall=0.744] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.83      0.34         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.36      0.40      0.38        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.57      0.77      0.66        90
     PER.NOM       0.71      0.81      0.75       208

   micro avg       0.59      0.74      0.65       389
   macro avg       0.39      0.59      0.46       389
weighted avg       0.61      0.74      0.66       389



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.14it/s, F1=0.931, train_acc=0.999, train_loss=0.524, train_precision=0.927, train_recall=0.937]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.95      0.96        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.86      1.00      0.92        12
     LOC.NOM       0.86      0.92      0.89        13
     ORG.NAM       0.95      0.98      0.96        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.97      0.98      0.98       105
     PER.NOM       0.97      0.98      0.98       141

   micro avg       0.95      0.97      0.96       381
   macro avg       0.80      0.84      0.82       381
weighted avg       0.95      0.97      0.96       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.672, eval_acc=0.966, eval_loss=9.63, eval_precision=0.604, eval_recall=0.768]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.24      1.00      0.39         6
     LOC.NOM       0.12      0.33      0.17         6
     ORG.NAM       0.37      0.47      0.41        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.61      0.73      0.66        90
     PER.NOM       0.74      0.77      0.76       208

   micro avg       0.60      0.72      0.66       389
   macro avg       0.40      0.61      0.46       389
weighted avg       0.63      0.72      0.67       389



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.976, train_acc=0.999, train_loss=0.264, train_precision=0.972, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.98      0.98        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       0.93      1.00      0.96        13
     ORG.NAM       0.98      1.00      0.99        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       1.00      0.99      1.00       105
     PER.NOM       0.99      1.00      1.00       141

   micro avg       0.98      0.99      0.98       381
   macro avg       0.84      0.86      0.85       381
weighted avg       0.98      0.99      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.665, eval_acc=0.968, eval_loss=9.79, eval_precision=0.598, eval_recall=0.762]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      1.00      0.41         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.37      0.45      0.40        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.62      0.77      0.69        90
     PER.NOM       0.74      0.79      0.76       208

   micro avg       0.61      0.74      0.67       389
   macro avg       0.41      0.62      0.47       389
weighted avg       0.64      0.74      0.68       389



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:10<00:00,  3.17it/s, F1=0.984, train_acc=0.999, train_loss=0.298, train_precision=0.98, train_recall=0.987] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.98      0.99        43
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       0.87      1.00      0.93        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      1.00      1.00       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.98      0.99      0.98       381
   macro avg       0.83      0.86      0.85       381
weighted avg       0.98      0.99      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.651, eval_acc=0.967, eval_loss=9.65, eval_precision=0.592, eval_recall=0.734]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      1.00      0.43         6
     LOC.NOM       0.15      0.33      0.21         6
     ORG.NAM       0.39      0.45      0.42        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.64      0.72      0.68        90
     PER.NOM       0.72      0.78      0.75       208

   micro avg       0.62      0.72      0.67       389
   macro avg       0.43      0.61      0.49       389
weighted avg       0.64      0.72      0.67       389



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.23it/s, F1=0.988, train_acc=0.999, train_loss=0.261, train_precision=0.986, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.98      0.99        43
     GPE.NOM       0.67      1.00      0.80         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.98      0.98      0.98       105
     PER.NOM       0.98      0.99      0.99       141

   micro avg       0.98      0.99      0.98       381
   macro avg       0.93      0.98      0.95       381
weighted avg       0.98      0.99      0.98       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.24it/s, F1=0.679, eval_acc=0.968, eval_loss=9.99, eval_precision=0.605, eval_recall=0.779]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.81      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.21      1.00      0.35         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.34      0.47      0.40        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.57      0.78      0.66        90
     PER.NOM       0.75      0.78      0.77       208

   micro avg       0.59      0.74      0.66       389
   macro avg       0.38      0.60      0.44       389
weighted avg       0.63      0.74      0.67       389



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.27it/s, F1=0.992, train_acc=0.999, train_loss=0.211, train_precision=0.99, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       0.95      0.98      0.96        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       0.99      0.99      0.99       105
     PER.NOM       1.00      0.99      1.00       141

   micro avg       0.98      0.99      0.99       381
   macro avg       0.97      0.98      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.688, eval_acc=0.967, eval_loss=10.4, eval_precision=0.607, eval_recall=0.798]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.81      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      1.00      0.41         6
     LOC.NOM       0.11      0.33      0.17         6
     ORG.NAM       0.34      0.45      0.39        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.60      0.80      0.69        90
     PER.NOM       0.72      0.82      0.77       208

   micro avg       0.60      0.76      0.67       389
   macro avg       0.40      0.63      0.47       389
weighted avg       0.62      0.76      0.68       389



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.34it/s, F1=0.994, train_acc=1, train_loss=0.126, train_precision=0.992, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99        43
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.91      0.93      0.92       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.691, eval_acc=0.968, eval_loss=10.4, eval_precision=0.612, eval_recall=0.796]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      1.00      0.44         6
     LOC.NOM       0.13      0.33      0.19         6
     ORG.NAM       0.34      0.45      0.39        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.62      0.80      0.70        90
     PER.NOM       0.72      0.82      0.77       208

   micro avg       0.60      0.76      0.67       389
   macro avg       0.40      0.63      0.47       389
weighted avg       0.62      0.76      0.68       389



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.25it/s, F1=0.994, train_acc=1, train_loss=0.113, train_precision=0.992, train_recall=0.995]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       1.00      1.00      1.00       105
     PER.NOM       0.99      0.99      0.99       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.99      0.98       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.683, eval_acc=0.967, eval_loss=10.6, eval_precision=0.603, eval_recall=0.791]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      1.00      0.43         6
     LOC.NOM       0.13      0.33      0.19         6
     ORG.NAM       0.33      0.45      0.38        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.58      0.78      0.67        90
     PER.NOM       0.72      0.81      0.76       208

   micro avg       0.59      0.75      0.66       389
   macro avg       0.39      0.62      0.46       389
weighted avg       0.61      0.75      0.67       389



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.31it/s, F1=0.961, train_acc=1, train_loss=0.0867, train_precision=0.96, train_recall=0.962] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       0.82      0.90      0.86        10
     PER.NAM       1.00      0.99      1.00       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.98      0.99      0.98       381
weighted avg       1.00      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.92it/s, F1=0.688, eval_acc=0.967, eval_loss=10.6, eval_precision=0.61, eval_recall=0.791] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      1.00      0.41         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.34      0.45      0.39        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.59      0.78      0.67        90
     PER.NOM       0.73      0.81      0.77       208

   micro avg       0.60      0.75      0.67       389
   macro avg       0.40      0.62      0.47       389
weighted avg       0.62      0.75      0.68       389



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.25it/s, F1=0.99, train_acc=1, train_loss=0.136, train_precision=0.992, train_recall=0.989]     


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.95      0.97      0.96       105
     PER.NOM       1.00      1.00      1.00       141

   micro avg       0.99      0.99      0.99       381
   macro avg       0.99      1.00      1.00       381
weighted avg       0.99      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.68, eval_acc=0.968, eval_loss=10.5, eval_precision=0.613, eval_recall=0.769] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      1.00      0.44         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.35      0.45      0.39        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.63      0.78      0.70        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.62      0.75      0.68       389
   macro avg       0.42      0.62      0.48       389
weighted avg       0.64      0.75      0.69       389



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.22it/s, F1=0.985, train_acc=0.999, train_loss=0.215, train_precision=0.982, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        43
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        12
     LOC.NOM       1.00      1.00      1.00        13
     ORG.NAM       1.00      1.00      1.00        55
     ORG.NOM       1.00      1.00      1.00        10
     PER.NAM       0.97      0.96      0.97       105
     PER.NOM       0.98      0.99      0.99       141

   micro avg       0.98      0.99      0.99       381
   macro avg       0.99      0.99      0.99       381
weighted avg       0.98      0.99      0.99       381



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.644, eval_acc=0.966, eval_loss=10.5, eval_precision=0.555, eval_recall=0.775]


eval_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      1.00      0.41         6
     LOC.NOM       0.20      0.50      0.29         6
     ORG.NAM       0.34      0.53      0.41        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.57      0.80      0.66        90
     PER.NOM       0.71      0.82      0.76       208

   micro avg       0.58      0.78      0.66       389
   macro avg       0.38      0.66      0.47       389
weighted avg       0.61      0.78      0.68       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_500.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "d

calculate data/few_shot/weibo/train_500.json etag: 100%|██████████| 339k/339k [00:01<00:00, 259kB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 157MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 172MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 454kB/s]


load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 189167.68L/s]
build line mapper: 29L [00:00, 220752.84L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8022.88it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 280287.62it/s]
load dataset from data/few_shot/weibo/train_500.json: 0it [00:00, ?it/s]

load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_500.json: 500it [00:01, 488.03it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 505.29it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fr

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.000356, train_acc=0.559, train_loss=117, train_precision=0.000183, train_recall=0.00876] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.00      0.00      0.00       223
     PER.NOM       0.00      0.01      0.00       268

   micro avg       0.00      0.01      0.00       695
   macro avg       0.00      0.00      0.00       695
weighted avg       0.00      0.01      0.00       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.19it/s, F1=0, eval_acc=0.933, eval_loss=24.7, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.21it/s, F1=0, train_acc=0.934, train_loss=24.3, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.00      0.00      0.00       223
     PER.NOM       0.00      0.00      0.00       268

   micro avg       0.00      0.00      0.00       695
   macro avg       0.00      0.00      0.00       695
weighted avg       0.00      0.00      0.00       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0, eval_acc=0.933, eval_loss=18.6, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.19it/s, F1=0.097, train_acc=0.939, train_loss=16.1, train_precision=0.128, train_recall=0.0948]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.18      0.14      0.16       223
     PER.NOM       0.24      0.14      0.18       268

   micro avg       0.19      0.10      0.13       695
   macro avg       0.05      0.04      0.04       695
weighted avg       0.15      0.10      0.12       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.353, eval_acc=0.954, eval_loss=9.66, eval_precision=0.353, eval_recall=0.355]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.22      0.23      0.23        90
     PER.NOM       0.46      0.62      0.53       208

   micro avg       0.39      0.38      0.39       389
   macro avg       0.09      0.11      0.09       389
weighted avg       0.30      0.38      0.33       389



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.28it/s, F1=0.375, train_acc=0.959, train_loss=9.25, train_precision=0.351, train_recall=0.433]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.02      0.03      0.02        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.30      0.51      0.38       223
     PER.NOM       0.42      0.63      0.50       268

   micro avg       0.31      0.41      0.35       695
   macro avg       0.09      0.15      0.11       695
weighted avg       0.26      0.41      0.32       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.384, eval_acc=0.961, eval_loss=7.39, eval_precision=0.311, eval_recall=0.509]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.06      0.19      0.09        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.47      0.64      0.54        90
     PER.NOM       0.58      0.68      0.63       208

   micro avg       0.34      0.54      0.42       389
   macro avg       0.14      0.19      0.16       389
weighted avg       0.43      0.54      0.47       389



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0.556, train_acc=0.975, train_loss=5.58, train_precision=0.516, train_recall=0.62] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.17      0.26      0.20        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.22      0.47      0.30        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.60      0.77      0.67       223
     PER.NOM       0.62      0.76      0.68       268

   micro avg       0.47      0.62      0.54       695
   macro avg       0.20      0.28      0.23       695
weighted avg       0.47      0.62      0.53       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.548, eval_acc=0.961, eval_loss=6.74, eval_precision=0.458, eval_recall=0.689]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.38      0.50      0.43        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.22      0.43      0.29        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.37      0.76      0.50        90
     PER.NOM       0.66      0.81      0.72       208

   micro avg       0.47      0.69      0.56       389
   macro avg       0.20      0.31      0.24       389
weighted avg       0.49      0.69      0.57       389



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.728, train_acc=0.982, train_loss=3.75, train_precision=0.704, train_recall=0.77] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.37      0.59      0.46        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.49      0.72      0.58        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.66      0.83      0.74       223
     PER.NOM       0.81      0.90      0.85       268

   micro avg       0.62      0.75      0.68       695
   macro avg       0.29      0.38      0.33       695
weighted avg       0.62      0.75      0.68       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.611, eval_acc=0.966, eval_loss=6.67, eval_precision=0.541, eval_recall=0.704]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.40      0.65      0.50        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.23      0.38      0.29        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.56      0.73      0.64        90
     PER.NOM       0.72      0.80      0.76       208

   micro avg       0.54      0.69      0.61       389
   macro avg       0.24      0.32      0.27       389
weighted avg       0.57      0.69      0.62       389



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.783, train_acc=0.989, train_loss=2.43, train_precision=0.752, train_recall=0.829]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.61      0.79      0.69        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.06      0.10      0.07        21
     ORG.NAM       0.72      0.87      0.79        79
     ORG.NOM       0.17      0.15      0.16        13
     PER.NAM       0.81      0.90      0.85       223
     PER.NOM       0.87      0.93      0.90       268

   micro avg       0.73      0.83      0.78       695
   macro avg       0.40      0.47      0.43       695
weighted avg       0.74      0.83      0.78       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.612, eval_acc=0.966, eval_loss=7.82, eval_precision=0.575, eval_recall=0.665]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.49      0.65      0.56        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.07      0.17      0.10         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.25      0.32      0.28        47
     ORG.NOM       0.20      0.20      0.20         5
     PER.NAM       0.69      0.66      0.67        90
     PER.NOM       0.75      0.75      0.75       208

   micro avg       0.59      0.64      0.61       389
   macro avg       0.31      0.34      0.32       389
weighted avg       0.63      0.64      0.63       389



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.27it/s, F1=0.805, train_acc=0.99, train_loss=2.28, train_precision=0.779, train_recall=0.843] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.68      0.82      0.75        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.13      0.24      0.17        21
     LOC.NOM       0.15      0.19      0.17        21
     ORG.NAM       0.71      0.82      0.76        79
     ORG.NOM       0.36      0.38      0.37        13
     PER.NAM       0.84      0.92      0.88       223
     PER.NOM       0.89      0.94      0.91       268

   micro avg       0.76      0.85      0.80       695
   macro avg       0.47      0.54      0.50       695
weighted avg       0.78      0.85      0.81       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.22it/s, F1=0.633, eval_acc=0.968, eval_loss=6.4, eval_precision=0.564, eval_recall=0.726] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.81      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.25      0.38      0.31        47
     ORG.NOM       0.27      0.80      0.40         5
     PER.NAM       0.58      0.72      0.64        90
     PER.NOM       0.75      0.82      0.78       208

   micro avg       0.57      0.71      0.64       389
   macro avg       0.30      0.44      0.35       389
weighted avg       0.60      0.71      0.65       389



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.794, train_acc=0.992, train_loss=1.63, train_precision=0.768, train_recall=0.827]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.91      0.92        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.11      0.19      0.14        21
     LOC.NOM       0.09      0.14      0.11        21
     ORG.NAM       0.82      0.94      0.88        79
     ORG.NOM       0.39      0.54      0.45        13
     PER.NAM       0.85      0.92      0.89       223
     PER.NOM       0.89      0.93      0.91       268

   micro avg       0.79      0.87      0.83       695
   macro avg       0.51      0.57      0.54       695
weighted avg       0.81      0.87      0.84       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.622, eval_acc=0.968, eval_loss=7.63, eval_precision=0.578, eval_recall=0.678]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.81      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.28      0.32      0.30        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.68      0.68      0.68        90
     PER.NOM       0.75      0.77      0.76       208

   micro avg       0.60      0.67      0.63       389
   macro avg       0.33      0.42      0.37       389
weighted avg       0.64      0.67      0.65       389



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.30it/s, F1=0.856, train_acc=0.992, train_loss=1.6, train_precision=0.828, train_recall=0.893] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.94      0.94      0.94        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.18      0.29      0.22        21
     LOC.NOM       0.21      0.38      0.27        21
     ORG.NAM       0.82      0.94      0.88        79
     ORG.NOM       0.50      0.62      0.55        13
     PER.NAM       0.85      0.90      0.88       223
     PER.NOM       0.92      0.97      0.94       268

   micro avg       0.81      0.89      0.85       695
   macro avg       0.55      0.63      0.58       695
weighted avg       0.83      0.89      0.86       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.609, eval_acc=0.964, eval_loss=7.22, eval_precision=0.533, eval_recall=0.715]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.85      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.13      0.50      0.21         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.27      0.45      0.33        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.56      0.76      0.64        90
     PER.NOM       0.70      0.78      0.74       208

   micro avg       0.55      0.72      0.62       389
   macro avg       0.34      0.52      0.40       389
weighted avg       0.58      0.72      0.64       389



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.772, train_acc=0.985, train_loss=4.02, train_precision=0.766, train_recall=0.795]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.87      0.96      0.91        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.38      0.62      0.47        21
     LOC.NOM       0.17      0.19      0.18        21
     ORG.NAM       0.78      0.87      0.82        79
     ORG.NOM       0.57      0.62      0.59        13
     PER.NAM       0.60      0.70      0.65       223
     PER.NOM       0.89      0.94      0.91       268

   micro avg       0.73      0.82      0.77       695
   macro avg       0.53      0.61      0.57       695
weighted avg       0.74      0.82      0.77       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.628, eval_acc=0.966, eval_loss=7.2, eval_precision=0.559, eval_recall=0.721] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.73      0.64        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.50      0.40         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.26      0.51      0.34        47
     ORG.NOM       0.60      0.60      0.60         5
     PER.NAM       0.55      0.78      0.64        90
     PER.NOM       0.75      0.75      0.75       208

   micro avg       0.56      0.71      0.63       389
   macro avg       0.38      0.48      0.42       389
weighted avg       0.61      0.71      0.65       389



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0.874, train_acc=0.993, train_loss=1.61, train_precision=0.848, train_recall=0.909]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.92      0.96      0.94        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.48      0.52      0.50        21
     LOC.NOM       0.30      0.57      0.39        21
     ORG.NAM       0.90      0.95      0.93        79
     ORG.NOM       0.53      0.62      0.57        13
     PER.NAM       0.80      0.90      0.85       223
     PER.NOM       0.94      0.96      0.95       268

   micro avg       0.83      0.91      0.87       695
   macro avg       0.61      0.68      0.64       695
weighted avg       0.84      0.91      0.87       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.619, eval_acc=0.963, eval_loss=8.88, eval_precision=0.559, eval_recall=0.698]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.50      0.58      0.54        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.18      0.50      0.26         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.28      0.38      0.32        47
     ORG.NOM       0.56      1.00      0.71         5
     PER.NAM       0.53      0.71      0.61        90
     PER.NOM       0.73      0.77      0.75       208

   micro avg       0.57      0.68      0.62       389
   macro avg       0.35      0.49      0.40       389
weighted avg       0.59      0.68      0.63       389



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.908, train_acc=0.995, train_loss=1.11, train_precision=0.887, train_recall=0.935] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.90      0.90      0.90        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.83      0.95      0.89        21
     LOC.NOM       0.54      0.71      0.61        21
     ORG.NAM       0.91      0.95      0.93        79
     ORG.NOM       0.71      0.92      0.80        13
     PER.NAM       0.84      0.92      0.88       223
     PER.NOM       0.93      0.98      0.96       268

   micro avg       0.87      0.94      0.90       695
   macro avg       0.71      0.79      0.75       695
weighted avg       0.88      0.94      0.91       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.631, eval_acc=0.965, eval_loss=7.39, eval_precision=0.565, eval_recall=0.719]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.69      0.59        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.83      0.28         6
     LOC.NOM       0.12      0.33      0.17         6
     ORG.NAM       0.29      0.38      0.33        47
     ORG.NOM       0.62      1.00      0.77         5
     PER.NAM       0.59      0.72      0.65        90
     PER.NOM       0.77      0.78      0.78       208

   micro avg       0.58      0.71      0.64       389
   macro avg       0.38      0.59      0.45       389
weighted avg       0.63      0.71      0.66       389



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.29it/s, F1=0.91, train_acc=0.995, train_loss=0.89, train_precision=0.893, train_recall=0.935]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.94      0.93        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.76      0.90      0.83        21
     LOC.NOM       0.39      0.57      0.46        21
     ORG.NAM       0.81      0.92      0.86        79
     ORG.NOM       0.92      0.92      0.92        13
     PER.NAM       0.91      0.95      0.93       223
     PER.NOM       0.94      0.97      0.95       268

   micro avg       0.88      0.94      0.91       695
   macro avg       0.71      0.77      0.74       695
weighted avg       0.89      0.94      0.91       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.635, eval_acc=0.967, eval_loss=7.81, eval_precision=0.567, eval_recall=0.727]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.77      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.15      0.50      0.23         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.29      0.45      0.35        47
     ORG.NOM       0.45      1.00      0.62         5
     PER.NAM       0.63      0.74      0.68        90
     PER.NOM       0.76      0.78      0.77       208

   micro avg       0.59      0.72      0.65       389
   macro avg       0.36      0.53      0.41       389
weighted avg       0.63      0.72      0.67       389



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.75it/s, F1=0.955, train_acc=0.997, train_loss=0.574, train_precision=0.945, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99        68
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       0.83      0.95      0.89        21
     LOC.NOM       0.68      0.81      0.74        21
     ORG.NAM       0.94      0.96      0.95        79
     ORG.NOM       0.92      0.92      0.92        13
     PER.NAM       0.94      0.97      0.96       223
     PER.NOM       0.95      0.97      0.96       268

   micro avg       0.94      0.97      0.95       695
   macro avg       0.84      0.89      0.86       695
weighted avg       0.94      0.97      0.95       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.644, eval_acc=0.966, eval_loss=8.07, eval_precision=0.579, eval_recall=0.734]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.69      0.65        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.33      0.49      0.40        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.59      0.76      0.66        90
     PER.NOM       0.75      0.79      0.77       208

   micro avg       0.60      0.73      0.66       389
   macro avg       0.38      0.55      0.44       389
weighted avg       0.63      0.73      0.67       389



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.948, train_acc=0.997, train_loss=0.504, train_precision=0.938, train_recall=0.959]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.87      0.95      0.91        21
     LOC.NOM       0.88      1.00      0.93        21
     ORG.NAM       0.94      0.97      0.96        79
     ORG.NOM       1.00      0.92      0.96        13
     PER.NAM       0.96      0.98      0.97       223
     PER.NOM       0.95      0.97      0.96       268

   micro avg       0.95      0.97      0.96       695
   macro avg       0.82      0.85      0.83       695
weighted avg       0.95      0.97      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.606, eval_acc=0.961, eval_loss=8.98, eval_precision=0.529, eval_recall=0.718]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.81      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.18      0.50      0.26         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.32      0.45      0.37        47
     ORG.NOM       0.45      1.00      0.62         5
     PER.NAM       0.59      0.73      0.66        90
     PER.NOM       0.65      0.76      0.70       208

   micro avg       0.55      0.71      0.62       389
   macro avg       0.35      0.53      0.41       389
weighted avg       0.57      0.71      0.63       389



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.969, train_acc=0.997, train_loss=0.483, train_precision=0.963, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.99      0.97        68
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       1.00      0.95      0.98        21
     LOC.NOM       0.83      0.90      0.86        21
     ORG.NAM       0.94      0.97      0.96        79
     ORG.NOM       1.00      0.92      0.96        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.96      0.99      0.98       268

   micro avg       0.96      0.98      0.97       695
   macro avg       0.90      0.90      0.90       695
weighted avg       0.96      0.98      0.97       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.619, eval_acc=0.964, eval_loss=8.34, eval_precision=0.538, eval_recall=0.742]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.77      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.16      0.83      0.27         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.29      0.38      0.33        47
     ORG.NOM       0.42      1.00      0.59         5
     PER.NAM       0.57      0.77      0.65        90
     PER.NOM       0.77      0.81      0.79       208

   micro avg       0.57      0.74      0.64       389
   macro avg       0.35      0.57      0.41       389
weighted avg       0.62      0.74      0.67       389



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.28it/s, F1=0.977, train_acc=0.998, train_loss=0.315, train_precision=0.971, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       0.92      0.92      0.92        13
     PER.NAM       0.97      0.97      0.97       223
     PER.NOM       0.96      0.99      0.97       268

   micro avg       0.97      0.98      0.98       695
   macro avg       0.97      0.98      0.98       695
weighted avg       0.97      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.629, eval_acc=0.967, eval_loss=8.54, eval_precision=0.564, eval_recall=0.725]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.77      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.19      0.67      0.30         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.32      0.43      0.37        47
     ORG.NOM       0.42      1.00      0.59         5
     PER.NAM       0.61      0.79      0.69        90
     PER.NOM       0.76      0.76      0.76       208

   micro avg       0.60      0.71      0.65       389
   macro avg       0.36      0.55      0.42       389
weighted avg       0.64      0.71      0.67       389



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.19it/s, F1=0.982, train_acc=0.998, train_loss=0.266, train_precision=0.974, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      1.00      0.95        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.97      0.99      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      1.00      0.99       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.97      1.00      0.98       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.675, eval_acc=0.968, eval_loss=10, eval_precision=0.625, eval_recall=0.738]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.81      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.30      0.50      0.37         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.35      0.40      0.38        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.64      0.73      0.68        90
     PER.NOM       0.76      0.82      0.79       208

   micro avg       0.64      0.73      0.68       389
   macro avg       0.40      0.53      0.45       389
weighted avg       0.65      0.73      0.69       389



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.963, train_acc=0.998, train_loss=0.26, train_precision=0.959, train_recall=0.969] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.96      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.99      0.98       223
     PER.NOM       0.97      0.98      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      0.99      0.99       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.649, eval_acc=0.966, eval_loss=9.51, eval_precision=0.567, eval_recall=0.767]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.30      0.43      0.35        47
     ORG.NOM       0.38      1.00      0.56         5
     PER.NAM       0.58      0.80      0.67        90
     PER.NOM       0.76      0.84      0.79       208

   micro avg       0.60      0.77      0.67       389
   macro avg       0.38      0.61      0.46       389
weighted avg       0.63      0.77      0.69       389



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.27it/s, F1=0.987, train_acc=0.998, train_loss=0.266, train_precision=0.983, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       1.00      1.00      1.00        21
     ORG.NAM       0.96      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.99      0.99       223
     PER.NOM       0.97      0.98      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      0.99      0.99       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:04<00:00,  1.13it/s, F1=0.645, eval_acc=0.967, eval_loss=8.81, eval_precision=0.572, eval_recall=0.747]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.81      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.11      0.33      0.16         6
     ORG.NAM       0.34      0.47      0.39        47
     ORG.NOM       0.56      1.00      0.71         5
     PER.NAM       0.61      0.76      0.68        90
     PER.NOM       0.72      0.80      0.76       208

   micro avg       0.60      0.74      0.66       389
   macro avg       0.41      0.60      0.48       389
weighted avg       0.62      0.74      0.67       389



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.29it/s, F1=0.969, train_acc=0.999, train_loss=0.234, train_precision=0.962, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      1.00      0.95        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.97      0.99      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.97      0.99      0.98       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.97      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.653, eval_acc=0.967, eval_loss=8.76, eval_precision=0.587, eval_recall=0.738]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.67      0.42         6
     LOC.NOM       0.15      0.33      0.21         6
     ORG.NAM       0.30      0.43      0.35        47
     ORG.NOM       0.38      1.00      0.56         5
     PER.NAM       0.61      0.77      0.68        90
     PER.NOM       0.73      0.78      0.75       208

   micro avg       0.60      0.73      0.66       389
   macro avg       0.39      0.60      0.46       389
weighted avg       0.62      0.73      0.67       389



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.961, train_acc=0.998, train_loss=0.262, train_precision=0.96, train_recall=0.962] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.82      0.86      0.84        21
     LOC.NOM       0.86      0.86      0.86        21
     ORG.NAM       0.96      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.99      0.98       223
     PER.NOM       0.99      0.99      0.99       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.95      0.96      0.96       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.23it/s, F1=0.644, eval_acc=0.965, eval_loss=9.48, eval_precision=0.564, eval_recall=0.756]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.67      0.36         6
     LOC.NOM       0.17      0.50      0.25         6
     ORG.NAM       0.29      0.40      0.34        47
     ORG.NOM       0.31      1.00      0.48         5
     PER.NAM       0.61      0.78      0.68        90
     PER.NOM       0.73      0.82      0.77       208

   micro avg       0.59      0.75      0.66       389
   macro avg       0.38      0.63      0.45       389
weighted avg       0.62      0.75      0.68       389



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.981, train_acc=0.999, train_loss=0.215, train_precision=0.977, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.91      1.00      0.95        21
     ORG.NAM       0.96      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.98      0.98       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.97      0.99      0.98       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.97      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.674, eval_acc=0.968, eval_loss=9.57, eval_precision=0.648, eval_recall=0.707]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.50      0.40         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.34      0.40      0.37        47
     ORG.NOM       0.56      1.00      0.71         5
     PER.NAM       0.61      0.76      0.67        90
     PER.NOM       0.78      0.75      0.77       208

   micro avg       0.65      0.70      0.67       389
   macro avg       0.41      0.52      0.45       389
weighted avg       0.65      0.70      0.67       389



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.33it/s, F1=0.97, train_acc=0.998, train_loss=0.194, train_precision=0.964, train_recall=0.977] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.86      0.90      0.88        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.94      0.99      0.96        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      1.00      0.99       223
     PER.NOM       0.97      0.97      0.97       268

   micro avg       0.97      0.98      0.98       695
   macro avg       0.96      0.98      0.97       695
weighted avg       0.97      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.47it/s, F1=0.649, eval_acc=0.966, eval_loss=10.2, eval_precision=0.582, eval_recall=0.741]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.67      0.42         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.31      0.43      0.36        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.69      0.72      0.71        90
     PER.NOM       0.70      0.83      0.76       208

   micro avg       0.60      0.74      0.66       389
   macro avg       0.37      0.53      0.43       389
weighted avg       0.62      0.74      0.67       389



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.978, train_acc=0.999, train_loss=0.162, train_precision=0.971, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.95      0.97      0.96        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      1.00      0.99       223
     PER.NOM       0.98      1.00      0.99       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.99it/s, F1=0.642, eval_acc=0.967, eval_loss=9.82, eval_precision=0.591, eval_recall=0.711]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.67      0.44         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.29      0.43      0.34        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.68      0.70      0.69        90
     PER.NOM       0.74      0.76      0.75       208

   micro avg       0.61      0.70      0.65       389
   macro avg       0.39      0.53      0.44       389
weighted avg       0.65      0.70      0.67       389



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.982, train_acc=0.999, train_loss=0.177, train_precision=0.98, train_recall=0.986] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.95      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.99      0.99       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      0.99      0.99       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.672, eval_acc=0.969, eval_loss=9.58, eval_precision=0.622, eval_recall=0.74] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.71      0.85      0.77        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.32      0.45      0.38        47
     ORG.NOM       0.45      1.00      0.62         5
     PER.NAM       0.66      0.77      0.71        90
     PER.NOM       0.79      0.79      0.79       208

   micro avg       0.65      0.74      0.69       389
   macro avg       0.41      0.56      0.47       389
weighted avg       0.67      0.74      0.70       389



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.93it/s, F1=0.984, train_acc=0.999, train_loss=0.137, train_precision=0.984, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.95      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.99      0.99       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.97      0.98      0.98       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.659, eval_acc=0.968, eval_loss=10.2, eval_precision=0.59, eval_recall=0.751] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.67      0.36         6
     LOC.NOM       0.08      0.17      0.11         6
     ORG.NAM       0.29      0.43      0.35        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.64      0.77      0.70        90
     PER.NOM       0.76      0.83      0.79       208

   micro avg       0.61      0.75      0.68       389
   macro avg       0.38      0.56      0.44       389
weighted avg       0.64      0.75      0.69       389



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.21it/s, F1=0.975, train_acc=0.998, train_loss=0.23, train_precision=0.968, train_recall=0.987] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.90      0.90      0.90        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.95      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.98      0.98       223
     PER.NOM       0.97      1.00      0.99       268

   micro avg       0.97      0.99      0.98       695
   macro avg       0.97      0.98      0.98       695
weighted avg       0.97      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.616, eval_acc=0.967, eval_loss=9.36, eval_precision=0.587, eval_recall=0.656]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.67      0.33         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.31      0.36      0.33        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.64      0.71      0.67        90
     PER.NOM       0.79      0.68      0.73       208

   micro avg       0.62      0.65      0.64       389
   macro avg       0.38      0.53      0.43       389
weighted avg       0.66      0.65      0.65       389



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.96, train_acc=0.997, train_loss=0.564, train_precision=0.951, train_recall=0.973] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      1.00      0.95        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.94      0.92      0.93        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.93      0.97      0.95       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.95      0.98      0.96       695
   macro avg       0.96      0.98      0.97       695
weighted avg       0.95      0.98      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.663, eval_acc=0.968, eval_loss=8.79, eval_precision=0.616, eval_recall=0.721]


eval_reports:


calculate data/few_shot/weibo/train_500.json etag: 100%|██████████| 339k/339k [00:00<00:00, 248MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 192MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 194MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 533kB/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.73      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.40      0.33      0.36         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.28      0.45      0.34        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.59      0.77      0.67        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.62      0.71      0.66       389
   macro avg       0.39      0.48      0.42       389
weighted avg       0.64      0.71      0.67       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_500.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/w




load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 252879.04L/s]
build line mapper: 29L [00:00, 222367.12L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8483.39it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 277637.14it/s]
load dataset from data/few_shot/weibo/train_500.json: 54it [00:00, 538.81it/s]

load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_500.json: 500it [00:01, 498.50it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 504.65it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fr

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0, train_acc=0.726, train_loss=57.4, train_precision=0, train_recall=0] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.00      0.00      0.00       223
     PER.NOM       0.00      0.00      0.00       268

   micro avg       0.00      0.00      0.00       695
   macro avg       0.00      0.00      0.00       695
weighted avg       0.00      0.00      0.00       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0, eval_acc=0.933, eval_loss=19.6, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.00176, train_acc=0.932, train_loss=17.2, train_precision=0.00397, train_recall=0.00113]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.00      0.00      0.00       223
     PER.NOM       0.33      0.00      0.01       268

   micro avg       0.25      0.00      0.00       695
   macro avg       0.04      0.00      0.00       695
weighted avg       0.13      0.00      0.00       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.0639, eval_acc=0.935, eval_loss=9.77, eval_precision=0.167, eval_recall=0.0403]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.07      0.03      0.04        90
     PER.NOM       0.28      0.07      0.11       208

   micro avg       0.18      0.05      0.07       389
   macro avg       0.04      0.01      0.02       389
weighted avg       0.16      0.05      0.07       389



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.28it/s, F1=0.346, train_acc=0.949, train_loss=9.42, train_precision=0.485, train_recall=0.304] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.27      0.04      0.08        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.06      0.03      0.04        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.40      0.32      0.36       223
     PER.NOM       0.49      0.52      0.51       268

   micro avg       0.43      0.31      0.36       695
   macro avg       0.15      0.11      0.12       695
weighted avg       0.35      0.31      0.32       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.509, eval_acc=0.96, eval_loss=6.03, eval_precision=0.44, eval_recall=0.616]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.17      0.31      0.22        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.08      0.19      0.11        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.71      0.67      0.69        90
     PER.NOM       0.64      0.80      0.72       208

   micro avg       0.48      0.63      0.54       389
   macro avg       0.20      0.25      0.22       389
weighted avg       0.53      0.63      0.57       389



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.29it/s, F1=0.668, train_acc=0.972, train_loss=5.05, train_precision=0.693, train_recall=0.677]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.54      0.63      0.58        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.33      0.44      0.38        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.70      0.71      0.70       223
     PER.NOM       0.72      0.82      0.77       268

   micro avg       0.63      0.65      0.64       695
   macro avg       0.29      0.33      0.30       695
weighted avg       0.59      0.65      0.62       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.638, eval_acc=0.964, eval_loss=4.92, eval_precision=0.61, eval_recall=0.672] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.45      0.65      0.53        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.27      0.40      0.32        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.59      0.80      0.68        90
     PER.NOM       0.74      0.70      0.72       208

   micro avg       0.59      0.65      0.62       389
   macro avg       0.25      0.32      0.28       389
weighted avg       0.59      0.65      0.61       389



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.79it/s, F1=0.755, train_acc=0.984, train_loss=3.14, train_precision=0.752, train_recall=0.773]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.57      0.72      0.64        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.29      0.29      0.29        21
     LOC.NOM       0.43      0.14      0.21        21
     ORG.NAM       0.70      0.76      0.73        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.78      0.84      0.81       223
     PER.NOM       0.84      0.88      0.86       268

   micro avg       0.75      0.78      0.76       695
   macro avg       0.45      0.45      0.44       695
weighted avg       0.73      0.78      0.75       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.668, eval_acc=0.967, eval_loss=4.73, eval_precision=0.651, eval_recall=0.688]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.54      0.77      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.57      0.67      0.62         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.33      0.38      0.35        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.69      0.78      0.73        90
     PER.NOM       0.78      0.75      0.76       208

   micro avg       0.67      0.69      0.68       389
   macro avg       0.36      0.42      0.39       389
weighted avg       0.66      0.69      0.67       389



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.831, train_acc=0.985, train_loss=2.35, train_precision=0.832, train_recall=0.849]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.76      0.84      0.80        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.55      0.52      0.54        21
     LOC.NOM       0.44      0.38      0.41        21
     ORG.NAM       0.76      0.86      0.81        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.81      0.87      0.84       223
     PER.NOM       0.86      0.89      0.88       268

   micro avg       0.80      0.83      0.81       695
   macro avg       0.52      0.55      0.53       695
weighted avg       0.78      0.83      0.81       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.692, eval_acc=0.969, eval_loss=4.85, eval_precision=0.631, eval_recall=0.77] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.77      0.65        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.33      0.17      0.22         6
     ORG.NAM       0.37      0.40      0.39        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.63      0.84      0.72        90
     PER.NOM       0.72      0.82      0.77       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.40      0.48      0.43       389
weighted avg       0.63      0.75      0.68       389



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.855, train_acc=0.99, train_loss=1.65, train_precision=0.863, train_recall=0.857] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.84      0.90      0.87        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.52      0.52      0.52        21
     LOC.NOM       0.39      0.33      0.36        21
     ORG.NAM       0.86      0.95      0.90        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.88      0.89      0.89       223
     PER.NOM       0.91      0.94      0.92       268

   micro avg       0.85      0.87      0.86       695
   macro avg       0.55      0.57      0.56       695
weighted avg       0.84      0.87      0.86       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.688, eval_acc=0.968, eval_loss=5.16, eval_precision=0.663, eval_recall=0.717]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.37      0.40      0.39        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.69      0.80      0.74        90
     PER.NOM       0.79      0.75      0.77       208

   micro avg       0.67      0.70      0.69       389
   macro avg       0.39      0.49      0.43       389
weighted avg       0.68      0.70      0.69       389



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.898, train_acc=0.993, train_loss=1.24, train_precision=0.891, train_recall=0.911]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.83      0.88      0.86        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.57      0.57      0.57        21
     LOC.NOM       0.46      0.52      0.49        21
     ORG.NAM       0.89      0.94      0.91        79
     ORG.NOM       0.38      0.38      0.38        13
     PER.NAM       0.92      0.95      0.93       223
     PER.NOM       0.92      0.94      0.93       268

   micro avg       0.87      0.90      0.89       695
   macro avg       0.62      0.65      0.63       695
weighted avg       0.87      0.90      0.89       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.681, eval_acc=0.967, eval_loss=5.18, eval_precision=0.637, eval_recall=0.735]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.65      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.40      0.45      0.42        47
     ORG.NOM       0.38      0.60      0.46         5
     PER.NAM       0.62      0.83      0.71        90
     PER.NOM       0.78      0.77      0.77       208

   micro avg       0.64      0.73      0.68       389
   macro avg       0.41      0.56      0.47       389
weighted avg       0.66      0.73      0.69       389



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.912, train_acc=0.995, train_loss=0.952, train_precision=0.903, train_recall=0.927]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.96      0.96        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.68      0.81      0.74        21
     LOC.NOM       0.70      0.67      0.68        21
     ORG.NAM       0.94      0.95      0.94        79
     ORG.NOM       0.64      0.69      0.67        13
     PER.NAM       0.93      0.95      0.94       223
     PER.NOM       0.95      0.96      0.95       268

   micro avg       0.92      0.93      0.93       695
   macro avg       0.72      0.75      0.73       695
weighted avg       0.92      0.93      0.92       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.675, eval_acc=0.966, eval_loss=5.49, eval_precision=0.622, eval_recall=0.742]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.32      0.43      0.37        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.64      0.76      0.69        90
     PER.NOM       0.79      0.80      0.80       208

   micro avg       0.63      0.73      0.68       389
   macro avg       0.39      0.57      0.45       389
weighted avg       0.66      0.73      0.69       389



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0.919, train_acc=0.994, train_loss=0.942, train_precision=0.916, train_recall=0.927]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.94      0.97      0.96        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.87      0.95      0.91        21
     LOC.NOM       0.76      0.76      0.76        21
     ORG.NAM       0.91      0.94      0.92        79
     ORG.NOM       0.79      0.85      0.81        13
     PER.NAM       0.94      0.94      0.94       223
     PER.NOM       0.94      0.97      0.96       268

   micro avg       0.93      0.95      0.94       695
   macro avg       0.77      0.80      0.78       695
weighted avg       0.92      0.95      0.93       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.652, eval_acc=0.966, eval_loss=5.87, eval_precision=0.597, eval_recall=0.724]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.71      0.85      0.77        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.27      0.50      0.35         6
     ORG.NAM       0.37      0.45      0.40        47
     ORG.NOM       0.24      0.80      0.36         5
     PER.NAM       0.65      0.79      0.71        90
     PER.NOM       0.72      0.77      0.75       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.45      0.62      0.51       389
weighted avg       0.65      0.74      0.68       389



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.957, train_acc=0.997, train_loss=0.518, train_precision=0.953, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.93      0.93        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.94      0.81      0.87        21
     LOC.NOM       0.86      0.86      0.86        21
     ORG.NAM       0.96      1.00      0.98        79
     ORG.NOM       0.80      0.92      0.86        13
     PER.NAM       0.95      0.97      0.96       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.95      0.97      0.96       695
   macro avg       0.80      0.81      0.80       695
weighted avg       0.95      0.97      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.669, eval_acc=0.964, eval_loss=6.22, eval_precision=0.606, eval_recall=0.75] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      1.00      0.40         6
     LOC.NOM       0.17      0.50      0.25         6
     ORG.NAM       0.34      0.40      0.37        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.69      0.77      0.73        90
     PER.NOM       0.76      0.81      0.79       208

   micro avg       0.62      0.74      0.68       389
   macro avg       0.39      0.63      0.46       389
weighted avg       0.66      0.74      0.69       389



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.77it/s, F1=0.976, train_acc=0.998, train_loss=0.372, train_precision=0.969, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.99      0.96        68
     GPE.NOM       1.00      0.50      0.67         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.97      0.97      0.97        79
     ORG.NOM       0.86      0.92      0.89        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.97      0.98      0.97       695
   macro avg       0.95      0.91      0.92       695
weighted avg       0.97      0.98      0.97       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.678, eval_acc=0.965, eval_loss=6.53, eval_precision=0.617, eval_recall=0.758]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.77      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.33      0.67      0.44         6
     ORG.NAM       0.34      0.51      0.41        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.66      0.77      0.71        90
     PER.NOM       0.78      0.80      0.79       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.43      0.64      0.50       389
weighted avg       0.67      0.75      0.70       389



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.19it/s, F1=0.975, train_acc=0.998, train_loss=0.377, train_precision=0.974, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.91      0.95      0.93        21
     ORG.NAM       0.96      1.00      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.98      0.98       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.97      0.98      0.98       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.641, eval_acc=0.964, eval_loss=6.98, eval_precision=0.578, eval_recall=0.725]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.39      0.47      0.42        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.64      0.79      0.71        90
     PER.NOM       0.70      0.78      0.74       208

   micro avg       0.61      0.74      0.67       389
   macro avg       0.39      0.59      0.45       389
weighted avg       0.62      0.74      0.67       389



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.27it/s, F1=0.971, train_acc=0.998, train_loss=0.357, train_precision=0.967, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.97      0.97      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.96      0.98      0.97       268

   micro avg       0.97      0.98      0.98       695
   macro avg       0.98      0.99      0.98       695
weighted avg       0.97      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.23it/s, F1=0.661, eval_acc=0.966, eval_loss=6.33, eval_precision=0.588, eval_recall=0.759]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.77      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.32      0.47      0.38        47
     ORG.NOM       0.20      0.80      0.32         5
     PER.NAM       0.66      0.79      0.72        90
     PER.NOM       0.74      0.82      0.78       208

   micro avg       0.61      0.76      0.68       389
   macro avg       0.40      0.60      0.47       389
weighted avg       0.64      0.76      0.69       389



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.966, train_acc=0.997, train_loss=0.533, train_precision=0.961, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.96      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.94      0.95      0.95       223
     PER.NOM       0.96      0.99      0.97       268

   micro avg       0.96      0.98      0.97       695
   macro avg       0.97      0.98      0.98       695
weighted avg       0.96      0.98      0.97       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.691, eval_acc=0.968, eval_loss=7.54, eval_precision=0.67, eval_recall=0.716] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.85      0.76        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.50      0.50      0.50         6
     ORG.NAM       0.35      0.36      0.36        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.70      0.67      0.68        90
     PER.NOM       0.80      0.82      0.81       208

   micro avg       0.69      0.72      0.71       389
   macro avg       0.48      0.60      0.52       389
weighted avg       0.70      0.72      0.71       389



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.954, train_acc=0.995, train_loss=1.34, train_precision=0.947, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.97      0.99      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.88      0.91      0.90       223
     PER.NOM       0.97      0.98      0.98       268

   micro avg       0.95      0.96      0.96       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.95      0.96      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.702, eval_acc=0.968, eval_loss=6.04, eval_precision=0.663, eval_recall=0.75] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.35      0.43      0.38        47
     ORG.NOM       0.45      1.00      0.62         5
     PER.NAM       0.74      0.71      0.72        90
     PER.NOM       0.76      0.83      0.79       208

   micro avg       0.68      0.75      0.71       389
   macro avg       0.50      0.62      0.54       389
weighted avg       0.69      0.75      0.71       389



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.27it/s, F1=0.971, train_acc=0.998, train_loss=0.414, train_precision=0.97, train_recall=0.975] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.86      0.90      0.88        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       1.00      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.98      0.98       223
     PER.NOM       0.97      0.98      0.98       268

   micro avg       0.97      0.98      0.98       695
   macro avg       0.97      0.97      0.97       695
weighted avg       0.97      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.691, eval_acc=0.967, eval_loss=6.77, eval_precision=0.639, eval_recall=0.756]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.34      0.45      0.39        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.65      0.79      0.71        90
     PER.NOM       0.79      0.81      0.80       208

   micro avg       0.65      0.75      0.70       389
   macro avg       0.45      0.62      0.51       389
weighted avg       0.67      0.75      0.71       389



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.76it/s, F1=0.97, train_acc=0.998, train_loss=0.417, train_precision=0.961, train_recall=0.982] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.92      0.99      0.95        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.87      0.95      0.91        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.94      0.94      0.94        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.96      0.97      0.97       223
     PER.NOM       0.98      1.00      0.99       268

   micro avg       0.96      0.98      0.97       695
   macro avg       0.95      0.97      0.96       695
weighted avg       0.96      0.98      0.97       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.701, eval_acc=0.968, eval_loss=6.2, eval_precision=0.689, eval_recall=0.718] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.75      0.69      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.17      0.33      0.22         6
     ORG.NAM       0.38      0.49      0.43        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.73      0.72      0.73        90
     PER.NOM       0.84      0.75      0.79       208

   micro avg       0.70      0.70      0.70       389
   macro avg       0.50      0.60      0.53       389
weighted avg       0.73      0.70      0.72       389



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.27it/s, F1=0.983, train_acc=0.998, train_loss=0.294, train_precision=0.982, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.99      0.99        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       1.00      0.95      0.98        21
     ORG.NAM       0.95      0.96      0.96        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       1.00      0.99      0.99       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.98      0.98      0.98       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.47it/s, F1=0.69, eval_acc=0.967, eval_loss=7.37, eval_precision=0.65, eval_recall=0.741]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.24      0.83      0.37         6
     LOC.NOM       0.29      0.67      0.40         6
     ORG.NAM       0.37      0.40      0.38        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.69      0.74      0.72        90
     PER.NOM       0.82      0.78      0.80       208

   micro avg       0.67      0.73      0.70       389
   macro avg       0.45      0.66      0.51       389
weighted avg       0.70      0.73      0.71       389



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.965, train_acc=0.998, train_loss=0.308, train_precision=0.961, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      1.00      0.98        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.95      0.97      0.96        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.95      0.98      0.97       223
     PER.NOM       0.97      0.98      0.98       268

   micro avg       0.96      0.98      0.97       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.96      0.98      0.97       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.694, eval_acc=0.965, eval_loss=6.49, eval_precision=0.668, eval_recall=0.726]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.69      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.40      0.45      0.42        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.64      0.78      0.70        90
     PER.NOM       0.83      0.75      0.79       208

   micro avg       0.68      0.71      0.70       389
   macro avg       0.47      0.60      0.51       389
weighted avg       0.70      0.71      0.70       389



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.28it/s, F1=0.982, train_acc=0.999, train_loss=0.191, train_precision=0.981, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       1.00      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.99      0.99      0.99       268

   micro avg       0.99      0.99      0.99       695
   macro avg       0.99      0.99      0.99       695
weighted avg       0.99      0.99      0.99       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.687, eval_acc=0.965, eval_loss=7.35, eval_precision=0.648, eval_recall=0.734]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.70      0.81      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.24      0.83      0.37         6
     LOC.NOM       0.25      0.50      0.33         6
     ORG.NAM       0.35      0.45      0.39        47
     ORG.NOM       0.50      1.00      0.67         5
     PER.NAM       0.69      0.73      0.71        90
     PER.NOM       0.80      0.77      0.79       208

   micro avg       0.66      0.72      0.69       389
   macro avg       0.44      0.64      0.50       389
weighted avg       0.69      0.72      0.70       389



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.986, train_acc=0.999, train_loss=0.237, train_precision=0.983, train_recall=0.99]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.96      1.00      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.99      0.98       223
     PER.NOM       0.99      0.99      0.99       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.686, eval_acc=0.965, eval_loss=7.26, eval_precision=0.634, eval_recall=0.753]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.81      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.35      0.38      0.37        47
     ORG.NOM       0.42      1.00      0.59         5
     PER.NAM       0.73      0.74      0.74        90
     PER.NOM       0.76      0.84      0.80       208

   micro avg       0.66      0.75      0.70       389
   macro avg       0.43      0.62      0.49       389
weighted avg       0.67      0.75      0.71       389



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.19it/s, F1=0.967, train_acc=0.998, train_loss=0.209, train_precision=0.967, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       1.00      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.98      0.98       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      0.99      0.99       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.25it/s, F1=0.682, eval_acc=0.964, eval_loss=7.65, eval_precision=0.617, eval_recall=0.767]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.71      0.85      0.77        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.38      0.50      0.43         6
     ORG.NAM       0.33      0.38      0.36        47
     ORG.NOM       0.42      1.00      0.59         5
     PER.NAM       0.57      0.84      0.68        90
     PER.NOM       0.78      0.82      0.80       208

   micro avg       0.63      0.77      0.69       389
   macro avg       0.43      0.65      0.51       389
weighted avg       0.65      0.77      0.70       389



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.77it/s, F1=0.988, train_acc=0.998, train_loss=0.204, train_precision=0.986, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      0.95      0.95        21
     LOC.NOM       1.00      0.95      0.98        21
     ORG.NAM       0.99      1.00      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      1.00      0.99       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.99      0.99       695
   macro avg       0.99      0.98      0.99       695
weighted avg       0.98      0.99      0.99       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.693, eval_acc=0.965, eval_loss=7.3, eval_precision=0.648, eval_recall=0.747] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.67      0.33         6
     LOC.NOM       0.44      0.67      0.53         6
     ORG.NAM       0.39      0.40      0.40        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.69      0.82      0.75        90
     PER.NOM       0.76      0.78      0.77       208

   micro avg       0.66      0.74      0.70       389
   macro avg       0.45      0.62      0.51       389
weighted avg       0.67      0.74      0.70       389



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.992, train_acc=0.999, train_loss=0.146, train_precision=0.993, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      0.95      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.99      0.97      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.99      0.99       223
     PER.NOM       0.99      0.99      0.99       268

   micro avg       0.99      0.99      0.99       695
   macro avg       0.99      0.99      0.99       695
weighted avg       0.99      0.99      0.99       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.676, eval_acc=0.963, eval_loss=7.97, eval_precision=0.621, eval_recall=0.743]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.83      0.29         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.32      0.45      0.38        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.71      0.78      0.74        90
     PER.NOM       0.80      0.79      0.79       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.40      0.60      0.45       389
weighted avg       0.68      0.74      0.70       389



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.968, train_acc=0.998, train_loss=0.198, train_precision=0.966, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.96      0.97      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.99      0.99       223
     PER.NOM       0.98      0.99      0.99       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      0.99      0.98       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.679, eval_acc=0.963, eval_loss=7.32, eval_precision=0.618, eval_recall=0.755]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.77      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      0.83      0.40         6
     LOC.NOM       0.27      0.50      0.35         6
     ORG.NAM       0.32      0.45      0.37        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.66      0.81      0.73        90
     PER.NOM       0.78      0.81      0.79       208

   micro avg       0.63      0.76      0.69       389
   macro avg       0.41      0.62      0.48       389
weighted avg       0.66      0.76      0.70       389



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.31it/s, F1=0.981, train_acc=0.998, train_loss=0.207, train_precision=0.982, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      0.95      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.98      1.00      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.99      0.99      0.99       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.22it/s, F1=0.713, eval_acc=0.968, eval_loss=8.01, eval_precision=0.675, eval_recall=0.758]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.74      0.77      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.83      0.34         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.43      0.40      0.42        47
     ORG.NOM       0.62      1.00      0.77         5
     PER.NAM       0.62      0.83      0.71        90
     PER.NOM       0.79      0.81      0.80       208

   micro avg       0.67      0.76      0.71       389
   macro avg       0.48      0.62      0.52       389
weighted avg       0.68      0.76      0.71       389



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.974, train_acc=0.997, train_loss=0.303, train_precision=0.976, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.82      0.86      0.84        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.99      0.99       223
     PER.NOM       0.98      0.99      0.98       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.97      0.98      0.97       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.22it/s, F1=0.692, eval_acc=0.967, eval_loss=7.78, eval_precision=0.661, eval_recall=0.728]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.73      0.73      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.23      0.50      0.32         6
     LOC.NOM       0.33      0.17      0.22         6
     ORG.NAM       0.42      0.43      0.42        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.61      0.81      0.70        90
     PER.NOM       0.80      0.77      0.79       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.47      0.53      0.49       389
weighted avg       0.69      0.72      0.70       389



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.978, train_acc=0.998, train_loss=0.216, train_precision=0.976, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       1.00      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.99      0.98       223
     PER.NOM       0.97      0.97      0.97       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.98      0.99      0.98       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.719, eval_acc=0.97, eval_loss=7.4, eval_precision=0.702, eval_recall=0.739]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.81      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.50      0.50      0.50         6
     ORG.NAM       0.40      0.43      0.41        47
     ORG.NOM       0.71      1.00      0.83         5
     PER.NAM       0.77      0.71      0.74        90
     PER.NOM       0.80      0.80      0.80       208

   micro avg       0.71      0.73      0.72       389
   macro avg       0.52      0.63      0.56       389
weighted avg       0.72      0.73      0.72       389



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.968, train_acc=0.998, train_loss=0.183, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      0.95      0.95        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.99      1.00      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.99      0.99       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.99      0.99       695
   macro avg       0.98      0.98      0.98       695
weighted avg       0.98      0.99      0.99       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.699, eval_acc=0.968, eval_loss=7.83, eval_precision=0.658, eval_recall=0.75] 


eval_reports:


calculate data/few_shot/weibo/train_500.json etag: 100%|██████████| 339k/339k [00:00<00:00, 169MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 190MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 188MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 551kB/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.21      0.50      0.30         6
     ORG.NAM       0.41      0.38      0.40        47
     ORG.NOM       0.56      1.00      0.71         5
     PER.NAM       0.68      0.79      0.73        90
     PER.NOM       0.80      0.80      0.80       208

   micro avg       0.67      0.75      0.71       389
   macro avg       0.45      0.64      0.51       389
weighted avg       0.69      0.75      0.71       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_500.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/w


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 224005.19L/s]
build line mapper: 29L [00:00, 250793.44L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 7697.43it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 273754.11it/s]
load dataset from data/few_shot/weibo/train_500.json: 54it [00:00, 537.59it/s]

load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/ada2fdd9eb2e52ae2745d5d8c800bddd_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_500.json: 500it [00:01, 493.25it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 501.85it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fr

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0, train_acc=0.566, train_loss=97, train_precision=0, train_recall=0]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.00      0.00      0.00       223
     PER.NOM       0.00      0.00      0.00       268

   micro avg       0.00      0.00      0.00       695
   macro avg       0.00      0.00      0.00       695
weighted avg       0.00      0.00      0.00       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0, eval_acc=0.933, eval_loss=23.2, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0, train_acc=0.932, train_loss=23.2, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.00      0.00      0.00       223
     PER.NOM       0.00      0.00      0.00       268

   micro avg       0.00      0.00      0.00       695
   macro avg       0.00      0.00      0.00       695
weighted avg       0.00      0.00      0.00       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0, eval_acc=0.933, eval_loss=16.4, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.105, train_acc=0.942, train_loss=15.3, train_precision=0.122, train_recall=0.106]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.00      0.00      0.00        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.04      0.04      0.04       223
     PER.NOM       0.25      0.22      0.24       268

   micro avg       0.14      0.10      0.12       695
   macro avg       0.04      0.03      0.03       695
weighted avg       0.11      0.10      0.10       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.319, eval_acc=0.95, eval_loss=10.1, eval_precision=0.356, eval_recall=0.291] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.13      0.29      0.18        90
     PER.NOM       0.71      0.46      0.56       208

   micro avg       0.36      0.31      0.34       389
   macro avg       0.11      0.09      0.09       389
weighted avg       0.41      0.31      0.34       389



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.21it/s, F1=0.297, train_acc=0.959, train_loss=8.78, train_precision=0.279, train_recall=0.334]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.01      0.03      0.02        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.24      0.37      0.29       223
     PER.NOM       0.49      0.61      0.54       268

   micro avg       0.28      0.36      0.31       695
   macro avg       0.09      0.13      0.11       695
weighted avg       0.27      0.36      0.30       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.417, eval_acc=0.961, eval_loss=7.16, eval_precision=0.334, eval_recall=0.57] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.02      0.04      0.02        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.10      0.34      0.16        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.52      0.66      0.58        90
     PER.NOM       0.52      0.74      0.61       208

   micro avg       0.37      0.59      0.45       389
   macro avg       0.15      0.22      0.17       389
weighted avg       0.41      0.59      0.48       389



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.555, train_acc=0.973, train_loss=5.23, train_precision=0.525, train_recall=0.612]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.35      0.51      0.41        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.00      0.00      0.00        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.30      0.52      0.38        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.61      0.77      0.68       223
     PER.NOM       0.55      0.69      0.61       268

   micro avg       0.50      0.62      0.55       695
   macro avg       0.23      0.31      0.26       695
weighted avg       0.48      0.62      0.54       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.493, eval_acc=0.956, eval_loss=6.79, eval_precision=0.414, eval_recall=0.614]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.41      0.58      0.48        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.22      0.49      0.30        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.35      0.74      0.48        90
     PER.NOM       0.68      0.70      0.69       208

   micro avg       0.45      0.64      0.53       389
   macro avg       0.21      0.31      0.24       389
weighted avg       0.50      0.64      0.55       389



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.686, train_acc=0.983, train_loss=3.48, train_precision=0.647, train_recall=0.742]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.51      0.74      0.60        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.09      0.14      0.11        21
     LOC.NOM       0.00      0.00      0.00        21
     ORG.NAM       0.63      0.77      0.69        79
     ORG.NOM       0.00      0.00      0.00        13
     PER.NAM       0.67      0.81      0.73       223
     PER.NOM       0.75      0.84      0.80       268

   micro avg       0.64      0.75      0.69       695
   macro avg       0.33      0.41      0.37       695
weighted avg       0.63      0.75      0.68       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.568, eval_acc=0.958, eval_loss=7.33, eval_precision=0.47, eval_recall=0.722] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.40      0.77      0.53        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.08      0.17      0.11         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.22      0.45      0.29        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.46      0.74      0.57        90
     PER.NOM       0.67      0.80      0.73       208

   micro avg       0.48      0.71      0.57       389
   macro avg       0.23      0.37      0.28       389
weighted avg       0.52      0.71      0.59       389



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.792, train_acc=0.987, train_loss=2.61, train_precision=0.773, train_recall=0.824]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.68      0.82      0.75        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.24      0.33      0.28        21
     LOC.NOM       0.07      0.05      0.06        21
     ORG.NAM       0.74      0.87      0.80        79
     ORG.NOM       0.15      0.15      0.15        13
     PER.NAM       0.79      0.87      0.83       223
     PER.NOM       0.84      0.89      0.86       268

   micro avg       0.75      0.82      0.78       695
   macro avg       0.44      0.50      0.47       695
weighted avg       0.74      0.82      0.78       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.656, eval_acc=0.968, eval_loss=6.31, eval_precision=0.609, eval_recall=0.717]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.73      0.64        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.15      0.33      0.21         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.32      0.38      0.35        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.62      0.72      0.67        90
     PER.NOM       0.77      0.81      0.79       208

   micro avg       0.63      0.70      0.66       389
   macro avg       0.32      0.39      0.35       389
weighted avg       0.64      0.70      0.67       389



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.15it/s, F1=0.864, train_acc=0.992, train_loss=1.84, train_precision=0.85, train_recall=0.886] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.86      0.91      0.89        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.54      0.67      0.60        21
     LOC.NOM       0.36      0.38      0.37        21
     ORG.NAM       0.76      0.89      0.82        79
     ORG.NOM       0.07      0.08      0.07        13
     PER.NAM       0.88      0.92      0.90       223
     PER.NOM       0.92      0.95      0.93       268

   micro avg       0.83      0.88      0.86       695
   macro avg       0.55      0.60      0.57       695
weighted avg       0.84      0.88      0.86       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.644, eval_acc=0.967, eval_loss=6.79, eval_precision=0.594, eval_recall=0.713]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.73      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.67      0.28         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.30      0.43      0.35        47
     ORG.NOM       0.67      0.40      0.50         5
     PER.NAM       0.65      0.76      0.70        90
     PER.NOM       0.76      0.76      0.76       208

   micro avg       0.62      0.70      0.66       389
   macro avg       0.39      0.47      0.41       389
weighted avg       0.64      0.70      0.67       389



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.24it/s, F1=0.882, train_acc=0.994, train_loss=1.33, train_precision=0.868, train_recall=0.901] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.91      0.90        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.56      0.71      0.63        21
     LOC.NOM       0.73      0.52      0.61        21
     ORG.NAM       0.80      0.92      0.86        79
     ORG.NOM       0.62      0.62      0.62        13
     PER.NAM       0.91      0.95      0.93       223
     PER.NOM       0.91      0.96      0.93       268

   micro avg       0.87      0.92      0.89       695
   macro avg       0.68      0.70      0.68       695
weighted avg       0.87      0.92      0.89       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.648, eval_acc=0.965, eval_loss=7.47, eval_precision=0.588, eval_recall=0.726]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.81      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.50      0.25         6
     LOC.NOM       0.11      0.17      0.13         6
     ORG.NAM       0.34      0.34      0.34        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.58      0.72      0.64        90
     PER.NOM       0.73      0.81      0.77       208

   micro avg       0.59      0.72      0.65       389
   macro avg       0.35      0.52      0.41       389
weighted avg       0.61      0.72      0.66       389



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.925, train_acc=0.995, train_loss=1.02, train_precision=0.916, train_recall=0.937] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.93      0.91        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.79      0.90      0.84        21
     LOC.NOM       0.84      0.76      0.80        21
     ORG.NAM       0.89      0.95      0.92        79
     ORG.NOM       0.47      0.54      0.50        13
     PER.NAM       0.94      0.95      0.94       223
     PER.NOM       0.93      0.97      0.95       268

   micro avg       0.91      0.94      0.92       695
   macro avg       0.72      0.75      0.73       695
weighted avg       0.91      0.94      0.92       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.627, eval_acc=0.964, eval_loss=7.45, eval_precision=0.55, eval_recall=0.737] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.67      0.33         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.28      0.49      0.36        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.57      0.79      0.66        90
     PER.NOM       0.77      0.79      0.78       208

   micro avg       0.59      0.75      0.66       389
   macro avg       0.38      0.59      0.45       389
weighted avg       0.63      0.75      0.68       389



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.929, train_acc=0.996, train_loss=0.807, train_precision=0.924, train_recall=0.942]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.93      0.91        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.90      0.86      0.88        21
     LOC.NOM       0.81      0.81      0.81        21
     ORG.NAM       0.94      0.97      0.96        79
     ORG.NOM       0.77      0.77      0.77        13
     PER.NAM       0.94      0.97      0.95       223
     PER.NOM       0.94      0.96      0.95       268

   micro avg       0.93      0.95      0.94       695
   macro avg       0.77      0.78      0.78       695
weighted avg       0.92      0.95      0.93       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.17it/s, F1=0.664, eval_acc=0.968, eval_loss=7.59, eval_precision=0.628, eval_recall=0.711]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.39      0.47      0.43        47
     ORG.NOM       0.29      0.40      0.33         5
     PER.NAM       0.65      0.74      0.69        90
     PER.NOM       0.81      0.77      0.79       208

   micro avg       0.66      0.71      0.69       389
   macro avg       0.38      0.49      0.42       389
weighted avg       0.68      0.71      0.69       389



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.28it/s, F1=0.958, train_acc=0.997, train_loss=0.646, train_precision=0.95, train_recall=0.968] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.95      0.95      0.95        21
     LOC.NOM       0.83      0.90      0.86        21
     ORG.NAM       0.95      0.96      0.96        79
     ORG.NOM       0.71      0.77      0.74        13
     PER.NAM       0.96      0.98      0.97       223
     PER.NOM       0.93      0.95      0.94       268

   micro avg       0.94      0.96      0.95       695
   macro avg       0.79      0.81      0.80       695
weighted avg       0.94      0.96      0.95       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.673, eval_acc=0.968, eval_loss=7.78, eval_precision=0.615, eval_recall=0.75] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.81      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.40      0.67      0.50         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.37      0.49      0.42        47
     ORG.NOM       0.25      0.40      0.31         5
     PER.NAM       0.63      0.76      0.69        90
     PER.NOM       0.77      0.83      0.80       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.37      0.49      0.42       389
weighted avg       0.65      0.75      0.69       389



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.79it/s, F1=0.948, train_acc=0.996, train_loss=0.698, train_precision=0.935, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      1.00      0.98        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.82      0.86      0.84        21
     ORG.NAM       0.93      0.96      0.94        79
     ORG.NOM       0.92      0.92      0.92        13
     PER.NAM       0.95      0.97      0.96       223
     PER.NOM       0.94      0.97      0.95       268

   micro avg       0.93      0.97      0.95       695
   macro avg       0.80      0.83      0.82       695
weighted avg       0.93      0.97      0.95       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.64, eval_acc=0.964, eval_loss=7.81, eval_precision=0.571, eval_recall=0.732] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.57      0.67      0.62         6
     LOC.NOM       0.33      0.17      0.22         6
     ORG.NAM       0.31      0.45      0.37        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.50      0.86      0.63        90
     PER.NOM       0.76      0.78      0.77       208

   micro avg       0.59      0.75      0.66       389
   macro avg       0.43      0.57      0.48       389
weighted avg       0.62      0.75      0.67       389



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.932, train_acc=0.995, train_loss=0.936, train_precision=0.921, train_recall=0.948]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.90      0.90      0.90        21
     LOC.NOM       0.73      0.90      0.81        21
     ORG.NAM       0.90      0.94      0.92        79
     ORG.NOM       0.83      0.77      0.80        13
     PER.NAM       0.91      0.95      0.93       223
     PER.NOM       0.93      0.94      0.94       268

   micro avg       0.91      0.94      0.93       695
   macro avg       0.77      0.80      0.79       695
weighted avg       0.91      0.94      0.93       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.91it/s, F1=0.652, eval_acc=0.968, eval_loss=7.52, eval_precision=0.578, eval_recall=0.755]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.77      0.65        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.18      0.33      0.24         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.31      0.47      0.37        47
     ORG.NOM       0.20      1.00      0.33         5
     PER.NAM       0.73      0.72      0.73        90
     PER.NOM       0.74      0.86      0.79       208

   micro avg       0.61      0.75      0.67       389
   macro avg       0.34      0.52      0.39       389
weighted avg       0.64      0.75      0.69       389



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0.943, train_acc=0.997, train_loss=0.572, train_precision=0.933, train_recall=0.956]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.99      0.97        68
     GPE.NOM       0.00      0.00      0.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.77      0.81      0.79        21
     ORG.NAM       0.91      0.95      0.93        79
     ORG.NOM       0.92      0.92      0.92        13
     PER.NAM       0.94      0.96      0.95       223
     PER.NOM       0.95      0.97      0.96       268

   micro avg       0.93      0.96      0.94       695
   macro avg       0.80      0.82      0.81       695
weighted avg       0.93      0.96      0.94       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.648, eval_acc=0.963, eval_loss=8.44, eval_precision=0.573, eval_recall=0.753]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.67      0.27         6
     LOC.NOM       0.25      0.67      0.36         6
     ORG.NAM       0.32      0.43      0.36        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.62      0.74      0.68        90
     PER.NOM       0.75      0.82      0.78       208

   micro avg       0.60      0.75      0.67       389
   macro avg       0.38      0.63      0.46       389
weighted avg       0.63      0.75      0.68       389



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.961, train_acc=0.997, train_loss=0.439, train_precision=0.952, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.94      0.99      0.96        68
     GPE.NOM       0.50      0.50      0.50         2
     LOC.NAM       0.81      0.81      0.81        21
     LOC.NOM       0.83      0.90      0.86        21
     ORG.NAM       0.97      0.97      0.97        79
     ORG.NOM       0.86      0.92      0.89        13
     PER.NAM       0.95      0.97      0.96       223
     PER.NOM       0.97      0.99      0.98       268

   micro avg       0.95      0.97      0.96       695
   macro avg       0.85      0.88      0.87       695
weighted avg       0.95      0.97      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.634, eval_acc=0.967, eval_loss=8.04, eval_precision=0.596, eval_recall=0.683]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.58      0.59        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.40      0.67      0.50         6
     LOC.NOM       0.25      0.50      0.33         6
     ORG.NAM       0.34      0.57      0.43        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.65      0.79      0.71        90
     PER.NOM       0.81      0.73      0.76       208

   micro avg       0.64      0.71      0.67       389
   macro avg       0.45      0.58      0.50       389
weighted avg       0.68      0.71      0.69       389



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.27it/s, F1=0.981, train_acc=0.998, train_loss=0.325, train_precision=0.979, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      0.50      0.67         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.90      0.90      0.90        21
     ORG.NAM       0.99      1.00      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.99      0.98       223
     PER.NOM       0.97      0.97      0.97       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.97      0.92      0.94       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.646, eval_acc=0.963, eval_loss=9.05, eval_precision=0.565, eval_recall=0.762]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.81      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.18      0.50      0.26         6
     LOC.NOM       0.08      0.17      0.11         6
     ORG.NAM       0.36      0.55      0.44        47
     ORG.NOM       0.42      1.00      0.59         5
     PER.NAM       0.60      0.79      0.68        90
     PER.NOM       0.69      0.81      0.75       208

   micro avg       0.58      0.76      0.66       389
   macro avg       0.37      0.58      0.44       389
weighted avg       0.61      0.76      0.67       389



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.969, train_acc=0.998, train_loss=0.306, train_precision=0.96, train_recall=0.982] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      1.00      0.95        21
     LOC.NOM       0.90      0.90      0.90        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.99      0.98       223
     PER.NOM       0.95      0.99      0.97       268

   micro avg       0.97      0.99      0.98       695
   macro avg       0.97      0.98      0.97       695
weighted avg       0.97      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.656, eval_acc=0.967, eval_loss=8.49, eval_precision=0.605, eval_recall=0.723]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.77      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.67      0.36         6
     LOC.NOM       0.31      0.67      0.42         6
     ORG.NAM       0.32      0.49      0.39        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.68      0.73      0.71        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.64      0.73      0.68       389
   macro avg       0.44      0.61      0.50       389
weighted avg       0.67      0.73      0.69       389



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.966, train_acc=0.998, train_loss=0.378, train_precision=0.961, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.86      0.90      0.88        21
     ORG.NAM       0.98      1.00      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.94      0.96      0.95       223
     PER.NOM       0.96      0.97      0.96       268

   micro avg       0.96      0.97      0.96       695
   macro avg       0.96      0.98      0.97       695
weighted avg       0.96      0.97      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.681, eval_acc=0.968, eval_loss=8.74, eval_precision=0.665, eval_recall=0.702]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.74      0.88      0.81        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.67      0.40         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.42      0.47      0.44        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.71      0.73      0.72        90
     PER.NOM       0.78      0.74      0.76       208

   micro avg       0.69      0.71      0.70       389
   macro avg       0.47      0.58      0.51       389
weighted avg       0.70      0.71      0.70       389



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.79it/s, F1=0.961, train_acc=0.998, train_loss=0.402, train_precision=0.953, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      0.95      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.95      0.97      0.96       223
     PER.NOM       0.97      0.97      0.97       268

   micro avg       0.97      0.98      0.97       695
   macro avg       0.98      0.99      0.98       695
weighted avg       0.97      0.98      0.97       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.654, eval_acc=0.964, eval_loss=8.61, eval_precision=0.585, eval_recall=0.745]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.85      0.76        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.16      0.50      0.24         6
     LOC.NOM       0.23      0.50      0.32         6
     ORG.NAM       0.37      0.45      0.40        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.63      0.71      0.67        90
     PER.NOM       0.69      0.82      0.75       208

   micro avg       0.60      0.74      0.66       389
   macro avg       0.39      0.58      0.45       389
weighted avg       0.62      0.74      0.67       389



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.974, train_acc=0.998, train_loss=0.341, train_precision=0.969, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      0.95      0.95        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.93      0.97      0.95        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.99      0.99      0.99       223
     PER.NOM       0.98      0.99      0.98       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.97      0.98      0.98       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.92it/s, F1=0.703, eval_acc=0.967, eval_loss=9.34, eval_precision=0.681, eval_recall=0.731]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.74      0.88      0.81        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.67      0.40         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.36      0.30      0.33        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.65      0.73      0.69        90
     PER.NOM       0.77      0.81      0.79       208

   micro avg       0.67      0.72      0.70       389
   macro avg       0.46      0.57      0.50       389
weighted avg       0.67      0.72      0.69       389



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.97, train_acc=0.998, train_loss=0.329, train_precision=0.966, train_recall=0.976] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.98      0.99      0.99       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      1.00      0.99       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.68, eval_acc=0.968, eval_loss=8.79, eval_precision=0.664, eval_recall=0.7]   


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.81      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.67      0.40         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.34      0.34      0.34        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.68      0.74      0.71        90
     PER.NOM       0.79      0.77      0.78       208

   micro avg       0.67      0.70      0.69       389
   macro avg       0.44      0.56      0.48       389
weighted avg       0.68      0.70      0.69       389



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.22it/s, F1=0.976, train_acc=0.998, train_loss=0.266, train_precision=0.976, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.98      0.98      0.98       223
     PER.NOM       0.99      0.98      0.98       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.98      0.99      0.98       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.675, eval_acc=0.966, eval_loss=9.82, eval_precision=0.624, eval_recall=0.737]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.50      0.33         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.31      0.32      0.31        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.64      0.73      0.68        90
     PER.NOM       0.74      0.83      0.78       208

   micro avg       0.63      0.73      0.68       389
   macro avg       0.41      0.54      0.46       389
weighted avg       0.63      0.73      0.68       389



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.18it/s, F1=0.98, train_acc=0.999, train_loss=0.245, train_precision=0.973, train_recall=0.988] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      1.00      0.98        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.98      0.98       223
     PER.NOM       0.98      1.00      0.99       268

   micro avg       0.98      0.99      0.98       695
   macro avg       0.98      1.00      0.99       695
weighted avg       0.98      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.643, eval_acc=0.965, eval_loss=8.8, eval_precision=0.596, eval_recall=0.704] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.38      0.50      0.43         6
     ORG.NAM       0.33      0.47      0.39        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.59      0.71      0.65        90
     PER.NOM       0.78      0.76      0.77       208

   micro avg       0.62      0.71      0.66       389
   macro avg       0.42      0.57      0.48       389
weighted avg       0.65      0.71      0.67       389



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.29it/s, F1=0.979, train_acc=0.998, train_loss=0.279, train_precision=0.981, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      0.95      0.98        21
     LOC.NOM       1.00      0.95      0.98        21
     ORG.NAM       1.00      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.98      0.97       223
     PER.NOM       0.98      0.98      0.98       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.99      0.98      0.99       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.667, eval_acc=0.968, eval_loss=8.77, eval_precision=0.611, eval_recall=0.742]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.81      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.67      0.44         6
     LOC.NOM       0.27      0.50      0.35         6
     ORG.NAM       0.34      0.49      0.40        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.65      0.73      0.69        90
     PER.NOM       0.76      0.80      0.78       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.41      0.57      0.47       389
weighted avg       0.65      0.74      0.69       389



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0.974, train_acc=0.998, train_loss=0.196, train_precision=0.966, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.91      0.95      0.93        21
     LOC.NOM       0.95      1.00      0.98        21
     ORG.NAM       0.96      0.99      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.97      0.99      0.98       223
     PER.NOM       0.98      0.99      0.99       268

   micro avg       0.97      0.99      0.98       695
   macro avg       0.97      0.99      0.98       695
weighted avg       0.97      0.99      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.687, eval_acc=0.967, eval_loss=9.44, eval_precision=0.64, eval_recall=0.745] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.50      0.67      0.57         6
     ORG.NAM       0.35      0.38      0.36        47
     ORG.NOM       0.30      0.60      0.40         5
     PER.NAM       0.68      0.74      0.71        90
     PER.NOM       0.77      0.82      0.79       208

   micro avg       0.65      0.74      0.69       389
   macro avg       0.43      0.59      0.49       389
weighted avg       0.67      0.74      0.70       389



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.77it/s, F1=0.979, train_acc=0.999, train_loss=0.179, train_precision=0.975, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      0.90      0.95        21
     LOC.NOM       1.00      1.00      1.00        21
     ORG.NAM       0.95      0.97      0.96        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.95      0.98      0.96       223
     PER.NOM       0.99      0.99      0.99       268

   micro avg       0.97      0.98      0.98       695
   macro avg       0.99      0.98      0.98       695
weighted avg       0.97      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.03it/s, F1=0.634, eval_acc=0.962, eval_loss=10.2, eval_precision=0.563, eval_recall=0.732]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.85      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.20      0.67      0.31         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.27      0.45      0.33        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.56      0.72      0.63        90
     PER.NOM       0.79      0.78      0.79       208

   micro avg       0.58      0.72      0.65       389
   macro avg       0.37      0.57      0.44       389
weighted avg       0.63      0.72      0.67       389



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.959, train_acc=0.998, train_loss=0.352, train_precision=0.957, train_recall=0.963] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.95      0.95      0.95        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.96      0.97      0.97        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.96      0.97      0.97       223
     PER.NOM       1.00      0.98      0.99       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.98      0.98      0.98       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.26it/s, F1=0.623, eval_acc=0.958, eval_loss=10.9, eval_precision=0.53, eval_recall=0.762] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.50      0.35         6
     LOC.NOM       0.43      1.00      0.60         6
     ORG.NAM       0.26      0.53      0.35        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.55      0.76      0.64        90
     PER.NOM       0.68      0.80      0.73       208

   micro avg       0.54      0.76      0.63       389
   macro avg       0.39      0.65      0.48       389
weighted avg       0.58      0.76      0.65       389



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.19it/s, F1=0.969, train_acc=0.998, train_loss=0.345, train_precision=0.965, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       1.00      1.00      1.00        21
     LOC.NOM       0.95      0.95      0.95        21
     ORG.NAM       0.99      0.99      0.99        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.96      0.97      0.97       223
     PER.NOM       0.99      0.99      0.99       268

   micro avg       0.98      0.98      0.98       695
   macro avg       0.99      0.99      0.99       695
weighted avg       0.98      0.98      0.98       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.645, eval_acc=0.965, eval_loss=9.69, eval_precision=0.584, eval_recall=0.728]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.83      0.50         6
     LOC.NOM       0.31      0.67      0.42         6
     ORG.NAM       0.31      0.49      0.38        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.63      0.73      0.68        90
     PER.NOM       0.77      0.78      0.78       208

   micro avg       0.62      0.74      0.67       389
   macro avg       0.41      0.62      0.49       389
weighted avg       0.65      0.74      0.68       389



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.952, train_acc=0.997, train_loss=0.773, train_precision=0.946, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00        68
     GPE.NOM       1.00      1.00      1.00         2
     LOC.NAM       0.87      0.95      0.91        21
     LOC.NOM       0.91      1.00      0.95        21
     ORG.NAM       0.97      0.99      0.98        79
     ORG.NOM       1.00      1.00      1.00        13
     PER.NAM       0.90      0.96      0.93       223
     PER.NOM       0.96      0.96      0.96       268

   micro avg       0.94      0.97      0.96       695
   macro avg       0.95      0.98      0.97       695
weighted avg       0.94      0.97      0.96       695



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.579, eval_acc=0.961, eval_loss=17.1, eval_precision=0.728, eval_recall=0.485]


eval_reports:


calculate data/few_shot/weibo/train_1000.json etag:   0%|          | 0.00/665k [00:00<?, ?B/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.75      0.50      0.60         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.38      0.26      0.30        47
     ORG.NOM       0.80      0.80      0.80         5
     PER.NAM       0.58      0.41      0.48        90
     PER.NOM       0.86      0.52      0.65       208

   micro avg       0.70      0.48      0.57       389
   macro avg       0.50      0.41      0.44       389
weighted avg       0.70      0.48      0.56       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_1000.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/

calculate data/few_shot/weibo/train_1000.json etag: 100%|██████████| 665k/665k [00:00<00:00, 20.1MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 190MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 291MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 544kB/s]


load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 238032.91L/s]
build line mapper: 29L [00:00, 29900.40L/s]9 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8510.69it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 280958.16it/s]

load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding



load dataset from data/few_shot/weibo/train_1000.json: 1000it [00:01, 505.65it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 505.85it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mode

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.27it/s, F1=0.000278, train_acc=0.777, train_loss=55.7, train_precision=0.000146, train_recall=0.00313]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.00      0.00      0.00       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.00      0.01      0.00       432
     PER.NOM       0.00      0.01      0.00       543

   micro avg       0.00      0.01      0.00      1363
   macro avg       0.00      0.00      0.00      1363
weighted avg       0.00      0.01      0.00      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.25it/s, F1=0, eval_acc=0.933, eval_loss=16.4, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.95it/s, F1=0.18, train_acc=0.948, train_loss=11.8, train_precision=0.176, train_recall=0.201]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.11      0.08      0.09       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.03      0.03      0.03       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.06      0.09      0.07       432
     PER.NOM       0.48      0.44      0.46       543

   micro avg       0.20      0.22      0.21      1363
   macro avg       0.08      0.08      0.08      1363
weighted avg       0.22      0.22      0.22      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.473, eval_acc=0.956, eval_loss=8.27, eval_precision=0.37, eval_recall=0.67]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.27      0.65      0.38        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.09      0.13      0.11        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.23      0.62      0.33        90
     PER.NOM       0.66      0.84      0.74       208

   micro avg       0.39      0.65      0.49       389
   macro avg       0.16      0.28      0.19       389
weighted avg       0.43      0.65      0.51       389



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0.59, train_acc=0.972, train_loss=5.8, train_precision=0.571, train_recall=0.643]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.53      0.74      0.62       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.34      0.45      0.39       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.49      0.65      0.56       432
     PER.NOM       0.71      0.79      0.75       543

   micro avg       0.54      0.64      0.59      1363
   macro avg       0.26      0.33      0.29      1363
weighted avg       0.53      0.64      0.58      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.577, eval_acc=0.96, eval_loss=6.79, eval_precision=0.481, eval_recall=0.727] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.38      0.69      0.49        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.20      0.50      0.29         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.25      0.47      0.33        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.39      0.78      0.52        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.50      0.72      0.59       389
   macro avg       0.24      0.40      0.30       389
weighted avg       0.54      0.72      0.61       389



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.717, train_acc=0.98, train_loss=4, train_precision=0.693, train_recall=0.761]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.69      0.81      0.75       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.13      0.22      0.16        41
     LOC.NOM       0.14      0.08      0.10        38
     ORG.NAM       0.63      0.77      0.69       141
     ORG.NOM       0.17      0.04      0.06        27
     PER.NAM       0.62      0.76      0.69       432
     PER.NOM       0.77      0.85      0.81       543

   micro avg       0.66      0.75      0.70      1363
   macro avg       0.39      0.44      0.41      1363
weighted avg       0.65      0.75      0.70      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.25it/s, F1=0.635, eval_acc=0.966, eval_loss=6.44, eval_precision=0.544, eval_recall=0.766]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.88      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.04      0.17      0.07         6
     ORG.NAM       0.32      0.55      0.40        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.58      0.76      0.66        90
     PER.NOM       0.75      0.84      0.79       208

   micro avg       0.57      0.76      0.65       389
   macro avg       0.33      0.50      0.39       389
weighted avg       0.62      0.76      0.68       389



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.769, train_acc=0.986, train_loss=2.66, train_precision=0.744, train_recall=0.812]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.83      0.89      0.86       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.20      0.34      0.25        41
     LOC.NOM       0.31      0.29      0.30        38
     ORG.NAM       0.77      0.89      0.83       141
     ORG.NOM       0.54      0.48      0.51        27
     PER.NAM       0.69      0.82      0.75       432
     PER.NOM       0.83      0.90      0.86       543

   micro avg       0.73      0.83      0.78      1363
   macro avg       0.52      0.58      0.54      1363
weighted avg       0.74      0.83      0.78      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.647, eval_acc=0.966, eval_loss=6.69, eval_precision=0.601, eval_recall=0.703]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.85      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.11      0.33      0.17         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.40      0.38        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.65      0.73      0.69        90
     PER.NOM       0.75      0.74      0.74       208

   micro avg       0.61      0.68      0.65       389
   macro avg       0.36      0.48      0.41       389
weighted avg       0.64      0.68      0.66       389



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:41<00:00,  3.01it/s, F1=0.85, train_acc=0.991, train_loss=1.77, train_precision=0.832, train_recall=0.878] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.85      0.91      0.88       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.58      0.76      0.66        41
     LOC.NOM       0.40      0.42      0.41        38
     ORG.NAM       0.85      0.91      0.88       141
     ORG.NOM       0.53      0.59      0.56        27
     PER.NAM       0.81      0.88      0.84       432
     PER.NOM       0.88      0.93      0.91       543

   micro avg       0.82      0.88      0.85      1363
   macro avg       0.61      0.67      0.64      1363
weighted avg       0.82      0.88      0.85      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.665, eval_acc=0.965, eval_loss=7.42, eval_precision=0.608, eval_recall=0.735]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.19      0.50      0.27         6
     LOC.NOM       0.06      0.17      0.09         6
     ORG.NAM       0.42      0.49      0.45        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.63      0.78      0.70        90
     PER.NOM       0.76      0.77      0.77       208

   micro avg       0.62      0.73      0.67       389
   macro avg       0.37      0.54      0.42       389
weighted avg       0.65      0.73      0.68       389



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.865, train_acc=0.992, train_loss=1.43, train_precision=0.842, train_recall=0.9]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.91      0.94      0.93       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.65      0.83      0.73        41
     LOC.NOM       0.44      0.58      0.50        38
     ORG.NAM       0.88      0.93      0.90       141
     ORG.NOM       0.54      0.56      0.55        27
     PER.NAM       0.86      0.93      0.90       432
     PER.NOM       0.89      0.94      0.91       543

   micro avg       0.85      0.91      0.88      1363
   macro avg       0.65      0.71      0.68      1363
weighted avg       0.85      0.91      0.88      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.641, eval_acc=0.961, eval_loss=8.18, eval_precision=0.555, eval_recall=0.759]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.85      0.64        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.36      0.43      0.39        47
     ORG.NOM       0.19      0.80      0.31         5
     PER.NAM       0.50      0.81      0.62        90
     PER.NOM       0.75      0.82      0.79       208

   micro avg       0.56      0.76      0.65       389
   macro avg       0.33      0.59      0.41       389
weighted avg       0.60      0.76      0.66       389



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0.902, train_acc=0.994, train_loss=1.19, train_precision=0.882, train_recall=0.929]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.91      0.93      0.92       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.78      0.88      0.83        41
     LOC.NOM       0.53      0.63      0.58        38
     ORG.NAM       0.93      0.95      0.94       141
     ORG.NOM       0.79      0.81      0.80        27
     PER.NAM       0.86      0.92      0.89       432
     PER.NOM       0.91      0.96      0.94       543

   micro avg       0.88      0.93      0.90      1363
   macro avg       0.71      0.76      0.74      1363
weighted avg       0.88      0.93      0.90      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.675, eval_acc=0.966, eval_loss=7.37, eval_precision=0.617, eval_recall=0.747]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.85      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.83      0.50         6
     LOC.NOM       0.08      0.17      0.11         6
     ORG.NAM       0.34      0.45      0.39        47
     ORG.NOM       0.27      0.80      0.40         5
     PER.NAM       0.68      0.77      0.72        90
     PER.NOM       0.79      0.80      0.79       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.38      0.58      0.45       389
weighted avg       0.67      0.74      0.70       389



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.99it/s, F1=0.93, train_acc=0.996, train_loss=0.888, train_precision=0.917, train_recall=0.951] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.96      0.96       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.77      0.90      0.83        41
     LOC.NOM       0.68      0.71      0.69        38
     ORG.NAM       0.95      0.97      0.96       141
     ORG.NOM       0.85      0.85      0.85        27
     PER.NAM       0.91      0.95      0.93       432
     PER.NOM       0.94      0.97      0.95       543

   micro avg       0.92      0.95      0.93      1363
   macro avg       0.76      0.79      0.77      1363
weighted avg       0.92      0.95      0.93      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.696, eval_acc=0.969, eval_loss=7.88, eval_precision=0.655, eval_recall=0.745]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.33      0.29         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.36      0.34      0.35        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.68      0.78      0.73        90
     PER.NOM       0.77      0.83      0.80       208

   micro avg       0.66      0.74      0.70       389
   macro avg       0.40      0.51      0.44       389
weighted avg       0.66      0.74      0.70       389



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.30it/s, F1=0.94, train_acc=0.996, train_loss=0.716, train_precision=0.93, train_recall=0.954]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.97      0.96       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.83      0.85      0.84        41
     LOC.NOM       0.84      0.82      0.83        38
     ORG.NAM       0.96      0.99      0.97       141
     ORG.NOM       0.92      0.89      0.91        27
     PER.NAM       0.93      0.96      0.94       432
     PER.NOM       0.94      0.97      0.96       543

   micro avg       0.93      0.96      0.94      1363
   macro avg       0.80      0.81      0.80      1363
weighted avg       0.93      0.96      0.94      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.678, eval_acc=0.966, eval_loss=8.34, eval_precision=0.607, eval_recall=0.77] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.06      0.17      0.09         6
     ORG.NAM       0.41      0.47      0.44        47
     ORG.NOM       0.19      0.80      0.31         5
     PER.NAM       0.70      0.77      0.73        90
     PER.NOM       0.76      0.85      0.80       208

   micro avg       0.63      0.77      0.69       389
   macro avg       0.39      0.59      0.45       389
weighted avg       0.67      0.77      0.71       389



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.942, train_acc=0.997, train_loss=0.586, train_precision=0.933, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.84      0.90      0.87        41
     LOC.NOM       0.80      0.84      0.82        38
     ORG.NAM       0.98      0.99      0.98       141
     ORG.NOM       0.93      0.93      0.93        27
     PER.NAM       0.93      0.97      0.95       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.94      0.96      0.95      1363
   macro avg       0.80      0.82      0.81      1363
weighted avg       0.94      0.96      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.7, eval_acc=0.967, eval_loss=8.61, eval_precision=0.683, eval_recall=0.72]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.78      0.81      0.79        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.08      0.17      0.11         6
     ORG.NAM       0.48      0.43      0.45        47
     ORG.NOM       0.20      0.80      0.32         5
     PER.NAM       0.72      0.70      0.71        90
     PER.NOM       0.78      0.80      0.79       208

   micro avg       0.67      0.71      0.69       389
   macro avg       0.38      0.46      0.40       389
weighted avg       0.70      0.71      0.70       389



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:41<00:00,  3.00it/s, F1=0.954, train_acc=0.997, train_loss=0.584, train_precision=0.951, train_recall=0.961]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       0.25      0.25      0.25         4
     LOC.NAM       0.90      0.90      0.90        41
     LOC.NOM       0.95      0.95      0.95        38
     ORG.NAM       0.98      0.98      0.98       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.95      0.95      0.95       432
     PER.NOM       0.96      0.97      0.96       543

   micro avg       0.95      0.96      0.96      1363
   macro avg       0.86      0.87      0.87      1363
weighted avg       0.95      0.96      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.647, eval_acc=0.962, eval_loss=8.54, eval_precision=0.576, eval_recall=0.741]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.06      0.17      0.08         6
     ORG.NAM       0.31      0.45      0.37        47
     ORG.NOM       0.17      0.80      0.29         5
     PER.NAM       0.65      0.73      0.69        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.58      0.73      0.65       389
   macro avg       0.36      0.58      0.43       389
weighted avg       0.63      0.73      0.67       389



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.958, train_acc=0.997, train_loss=0.556, train_precision=0.948, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       0.75      0.75      0.75         4
     LOC.NAM       0.93      0.93      0.93        41
     LOC.NOM       0.95      0.97      0.96        38
     ORG.NAM       0.93      0.95      0.94       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.92      0.96      0.94       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.95      0.97      0.96      1363
   macro avg       0.93      0.94      0.93      1363
weighted avg       0.95      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.67, eval_acc=0.965, eval_loss=9.08, eval_precision=0.62, eval_recall=0.733]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.38      0.38      0.38        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.68      0.78      0.73        90
     PER.NOM       0.74      0.78      0.76       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.40      0.57      0.46       389
weighted avg       0.65      0.72      0.68       389



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.954, train_acc=0.997, train_loss=0.398, train_precision=0.946, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       0.75      0.75      0.75         4
     LOC.NAM       0.93      0.98      0.95        41
     LOC.NOM       0.95      0.97      0.96        38
     ORG.NAM       0.97      0.99      0.98       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.93      0.97      0.95       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.95      0.97      0.96      1363
   macro avg       0.93      0.95      0.94      1363
weighted avg       0.95      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.80it/s, F1=0.697, eval_acc=0.968, eval_loss=9.83, eval_precision=0.671, eval_recall=0.727]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.81      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.47      0.38      0.42        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.72      0.68      0.70        90
     PER.NOM       0.79      0.82      0.80       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.43      0.54      0.46       389
weighted avg       0.70      0.72      0.70       389



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.95, train_acc=0.997, train_loss=0.387, train_precision=0.943, train_recall=0.96]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       0.75      0.75      0.75         4
     LOC.NAM       0.95      0.95      0.95        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.91      0.96      0.93       432
     PER.NOM       0.95      0.96      0.96       543

   micro avg       0.95      0.97      0.96      1363
   macro avg       0.94      0.94      0.94      1363
weighted avg       0.95      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.679, eval_acc=0.968, eval_loss=9.21, eval_precision=0.637, eval_recall=0.73] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.36      0.38      0.37        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.64      0.74      0.69        90
     PER.NOM       0.79      0.79      0.79       208

   micro avg       0.65      0.72      0.69       389
   macro avg       0.42      0.57      0.47       389
weighted avg       0.67      0.72      0.69       389



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.99it/s, F1=0.969, train_acc=0.997, train_loss=0.425, train_precision=0.963, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.93      0.94        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.94      0.97      0.95       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.96      0.98      0.97      1363
   macro avg       0.97      0.98      0.97      1363
weighted avg       0.96      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.689, eval_acc=0.966, eval_loss=9.56, eval_precision=0.636, eval_recall=0.755]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.43      0.43      0.43        47
     ORG.NOM       0.21      0.80      0.33         5
     PER.NAM       0.63      0.77      0.69        90
     PER.NOM       0.77      0.82      0.80       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.41      0.60      0.47       389
weighted avg       0.67      0.75      0.70       389



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.21it/s, F1=0.97, train_acc=0.998, train_loss=0.325, train_precision=0.964, train_recall=0.977] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      1.00      0.98        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.94      0.97      0.95       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.96      0.98      0.97      1363
   macro avg       0.97      0.98      0.98      1363
weighted avg       0.96      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.679, eval_acc=0.964, eval_loss=9.54, eval_precision=0.609, eval_recall=0.772]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.73      0.85      0.79        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.43      0.62      0.50        47
     ORG.NOM       0.19      0.80      0.31         5
     PER.NAM       0.62      0.80      0.70        90
     PER.NOM       0.76      0.80      0.78       208

   micro avg       0.64      0.77      0.70       389
   macro avg       0.44      0.61      0.49       389
weighted avg       0.66      0.77      0.71       389



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.958, train_acc=0.997, train_loss=0.418, train_precision=0.957, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.98      0.98      0.98        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.98      0.98      0.98       141
     ORG.NOM       0.96      0.89      0.92        27
     PER.NAM       0.94      0.97      0.95       432
     PER.NOM       0.96      0.97      0.96       543

   micro avg       0.96      0.97      0.97      1363
   macro avg       0.97      0.97      0.97      1363
weighted avg       0.96      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.26it/s, F1=0.682, eval_acc=0.965, eval_loss=9.65, eval_precision=0.628, eval_recall=0.747]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.70      0.88      0.78        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.12      0.33      0.17         6
     ORG.NAM       0.37      0.49      0.42        47
     ORG.NOM       0.27      0.80      0.40         5
     PER.NAM       0.69      0.74      0.72        90
     PER.NOM       0.76      0.80      0.78       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.41      0.59      0.47       389
weighted avg       0.67      0.74      0.70       389



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.98it/s, F1=0.925, train_acc=0.996, train_loss=0.856, train_precision=0.91, train_recall=0.947] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       0.80      1.00      0.89         4
     LOC.NAM       0.90      0.93      0.92        41
     LOC.NOM       0.90      0.95      0.92        38
     ORG.NAM       0.92      0.96      0.94       141
     ORG.NOM       0.76      0.81      0.79        27
     PER.NAM       0.85      0.92      0.88       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.91      0.95      0.93      1363
   macro avg       0.89      0.94      0.91      1363
weighted avg       0.91      0.95      0.93      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.654, eval_acc=0.965, eval_loss=8.99, eval_precision=0.601, eval_recall=0.721]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.35      0.40      0.38        47
     ORG.NOM       0.19      0.80      0.31         5
     PER.NAM       0.59      0.72      0.65        90
     PER.NOM       0.77      0.77      0.77       208

   micro avg       0.62      0.71      0.66       389
   macro avg       0.39      0.57      0.45       389
weighted avg       0.64      0.71      0.67       389



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.968, train_acc=0.998, train_loss=0.301, train_precision=0.962, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       0.75      0.75      0.75         4
     LOC.NAM       0.91      0.95      0.93        41
     LOC.NOM       0.90      0.95      0.92        38
     ORG.NAM       0.99      1.00      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.93      0.97      0.95       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.96      0.98      0.97      1363
   macro avg       0.93      0.94      0.94      1363
weighted avg       0.96      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.688, eval_acc=0.968, eval_loss=9.73, eval_precision=0.651, eval_recall=0.732]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.75      0.81      0.78        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.67      0.67      0.67         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.41      0.55      0.47        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.67      0.73      0.70        90
     PER.NOM       0.76      0.76      0.76       208

   micro avg       0.67      0.72      0.69       389
   macro avg       0.48      0.56      0.51       389
weighted avg       0.68      0.72      0.70       389



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.96, train_acc=0.998, train_loss=0.27, train_precision=0.957, train_recall=0.967]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.93      0.93        41
     LOC.NOM       0.97      0.95      0.96        38
     ORG.NAM       0.98      0.98      0.98       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.93      0.96      0.95       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.96      0.97      0.97      1363
   macro avg       0.96      0.97      0.97      1363
weighted avg       0.96      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.662, eval_acc=0.964, eval_loss=10, eval_precision=0.599, eval_recall=0.744]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.37      0.49      0.42        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.59      0.80      0.68        90
     PER.NOM       0.79      0.77      0.78       208

   micro avg       0.62      0.74      0.67       389
   macro avg       0.41      0.59      0.47       389
weighted avg       0.65      0.74      0.69       389



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.972, train_acc=0.998, train_loss=0.276, train_precision=0.969, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.98      0.95        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.93      0.96      0.95       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.96      0.97      0.97      1363
   macro avg       0.97      0.98      0.98      1363
weighted avg       0.96      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:04<00:00,  1.11it/s, F1=0.672, eval_acc=0.966, eval_loss=10.4, eval_precision=0.622, eval_recall=0.735]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.38      0.38      0.38        47
     ORG.NOM       0.27      0.80      0.40         5
     PER.NAM       0.68      0.74      0.71        90
     PER.NOM       0.75      0.79      0.77       208

   micro avg       0.65      0.73      0.69       389
   macro avg       0.43      0.60      0.49       389
weighted avg       0.66      0.73      0.69       389



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0.971, train_acc=0.998, train_loss=0.26, train_precision=0.967, train_recall=0.98]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.90      0.92        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.95      0.97      0.96       432
     PER.NOM       0.97      0.99      0.98       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.98      0.97      0.98      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.669, eval_acc=0.964, eval_loss=11.1, eval_precision=0.63, eval_recall=0.718] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.38      0.36      0.37        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.63      0.78      0.70        90
     PER.NOM       0.78      0.75      0.76       208

   micro avg       0.64      0.71      0.67       389
   macro avg       0.41      0.57      0.46       389
weighted avg       0.66      0.71      0.68       389



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.973, train_acc=0.998, train_loss=0.191, train_precision=0.97, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.91      0.95      0.93        41
     LOC.NOM       1.00      0.95      0.97        38
     ORG.NAM       0.98      0.99      0.99       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.95      0.97      0.96       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.672, eval_acc=0.965, eval_loss=11.5, eval_precision=0.627, eval_recall=0.728]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.44      0.67      0.53         6
     LOC.NOM       0.09      0.17      0.12         6
     ORG.NAM       0.37      0.43      0.40        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.69      0.77      0.73        90
     PER.NOM       0.76      0.76      0.76       208

   micro avg       0.65      0.72      0.68       389
   macro avg       0.41      0.56      0.46       389
weighted avg       0.67      0.72      0.69       389



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.973, train_acc=0.998, train_loss=0.188, train_precision=0.97, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.98      0.96        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.95      0.98      0.96       432
     PER.NOM       0.98      0.98      0.98       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.671, eval_acc=0.966, eval_loss=12, eval_precision=0.64, eval_recall=0.714]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.34      0.43      0.38        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.72      0.76      0.74        90
     PER.NOM       0.79      0.74      0.76       208

   micro avg       0.67      0.70      0.69       389
   macro avg       0.46      0.57      0.50       389
weighted avg       0.69      0.70      0.69       389



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:41<00:00,  3.02it/s, F1=0.953, train_acc=0.997, train_loss=0.591, train_precision=0.944, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       0.20      0.25      0.22         4
     LOC.NAM       0.81      0.93      0.86        41
     LOC.NOM       0.78      0.84      0.81        38
     ORG.NAM       0.97      0.99      0.98       141
     ORG.NOM       0.85      0.85      0.85        27
     PER.NAM       0.93      0.97      0.95       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.94      0.97      0.95      1363
   macro avg       0.81      0.85      0.83      1363
weighted avg       0.94      0.97      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.665, eval_acc=0.964, eval_loss=9.88, eval_precision=0.621, eval_recall=0.72] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.88      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.11      0.17      0.13         6
     ORG.NAM       0.36      0.38      0.37        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.69      0.78      0.73        90
     PER.NOM       0.76      0.76      0.76       208

   micro avg       0.64      0.71      0.67       389
   macro avg       0.36      0.48      0.40       389
weighted avg       0.66      0.71      0.68       389



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.27it/s, F1=0.961, train_acc=0.997, train_loss=0.414, train_precision=0.962, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.95      0.94        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.98      0.97      0.98       141
     ORG.NOM       0.92      0.89      0.91        27
     PER.NAM       0.95      0.97      0.96       432
     PER.NOM       0.96      0.96      0.96       543

   micro avg       0.96      0.97      0.96      1363
   macro avg       0.97      0.96      0.97      1363
weighted avg       0.96      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.695, eval_acc=0.968, eval_loss=9.7, eval_precision=0.676, eval_recall=0.717] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.88      0.77        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.43      0.38      0.40        47
     ORG.NOM       0.15      0.40      0.22         5
     PER.NAM       0.71      0.78      0.74        90
     PER.NOM       0.82      0.75      0.78       208

   micro avg       0.69      0.71      0.70       389
   macro avg       0.43      0.55      0.47       389
weighted avg       0.71      0.71      0.70       389



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.97, train_acc=0.998, train_loss=0.272, train_precision=0.964, train_recall=0.98]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.98      0.95        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.94      0.98      0.96       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.96      0.98      0.97      1363
   macro avg       0.97      0.99      0.98      1363
weighted avg       0.96      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.691, eval_acc=0.967, eval_loss=10.1, eval_precision=0.666, eval_recall=0.721]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.37      0.38      0.37        47
     ORG.NOM       0.30      0.60      0.40         5
     PER.NAM       0.70      0.77      0.73        90
     PER.NOM       0.82      0.76      0.79       208

   micro avg       0.68      0.71      0.70       389
   macro avg       0.45      0.57      0.49       389
weighted avg       0.70      0.71      0.70       389



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.20it/s, F1=0.945, train_acc=0.997, train_loss=0.541, train_precision=0.94, train_recall=0.954] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.93      0.93        41
     LOC.NOM       0.95      0.97      0.96        38
     ORG.NAM       0.96      0.96      0.96       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.91      0.94      0.93       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.95      0.96      0.96      1363
   macro avg       0.95      0.97      0.96      1363
weighted avg       0.95      0.96      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.696, eval_acc=0.968, eval_loss=9.49, eval_precision=0.665, eval_recall=0.732]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.50      0.17      0.25         6
     ORG.NAM       0.34      0.49      0.40        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.70      0.70      0.70        90
     PER.NOM       0.82      0.79      0.80       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.49      0.58      0.51       389
weighted avg       0.70      0.72      0.71       389



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:41<00:00,  3.00it/s, F1=0.955, train_acc=0.997, train_loss=0.555, train_precision=0.947, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.99      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.90      0.90      0.90        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.96      0.97      0.96       141
     ORG.NOM       0.96      0.93      0.94        27
     PER.NAM       0.89      0.94      0.92       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.95      0.96      0.95      1363
   macro avg       0.96      0.96      0.96      1363
weighted avg       0.95      0.96      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.21it/s, F1=0.694, eval_acc=0.968, eval_loss=8.69, eval_precision=0.689, eval_recall=0.7]  


eval_reports:


calculate data/few_shot/weibo/train_1000.json etag:   0%|          | 0.00/665k [00:00<?, ?B/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.85      0.76        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.33      0.17      0.22         6
     ORG.NAM       0.44      0.45      0.44        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.75      0.72      0.73        90
     PER.NOM       0.81      0.71      0.76       208

   micro avg       0.69      0.68      0.69       389
   macro avg       0.45      0.57      0.47       389
weighted avg       0.72      0.68      0.69       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_1000.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/

calculate data/few_shot/weibo/train_1000.json etag: 100%|██████████| 665k/665k [00:00<00:00, 283MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 186MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 193MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 504kB/s]


load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 229067.45L/s]
build line mapper: 29L [00:00, 250277.40L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8524.41it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 263319.53it/s]
load dataset from data/few_shot/weibo/train_1000.json: 36it [00:00, 356.09it/s]

load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_1000.json: 1000it [00:02, 348.04it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 451.85it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.19it/s, F1=0, train_acc=0.754, train_loss=47.9, train_precision=0, train_recall=0] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.00      0.00      0.00       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.00      0.00      0.00       432
     PER.NOM       0.00      0.00      0.00       543

   micro avg       0.00      0.00      0.00      1363
   macro avg       0.00      0.00      0.00      1363
weighted avg       0.00      0.00      0.00      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0, eval_acc=0.932, eval_loss=14.1, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.00      0.00      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.18it/s, F1=0.334, train_acc=0.952, train_loss=9.48, train_precision=0.354, train_recall=0.342]     


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.28      0.24      0.26       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.09      0.07      0.08       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.66      0.55      0.60       432
     PER.NOM       0.28      0.37      0.32       543

   micro avg       0.37      0.35      0.36      1363
   macro avg       0.16      0.15      0.16      1363
weighted avg       0.36      0.35      0.35      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.519, eval_acc=0.962, eval_loss=5.67, eval_precision=0.469, eval_recall=0.587]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.38      0.73      0.50        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.12      0.15      0.13        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.68      0.79      0.73        90
     PER.NOM       0.54      0.63      0.58       208

   micro avg       0.49      0.59      0.54       389
   macro avg       0.21      0.29      0.24       389
weighted avg       0.49      0.59      0.53       389



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.20it/s, F1=0.657, train_acc=0.974, train_loss=4.75, train_precision=0.638, train_recall=0.702]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.56      0.72      0.63       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.06      0.05      0.05        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.43      0.55      0.48       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.78      0.79      0.78       432
     PER.NOM       0.63      0.76      0.69       543

   micro avg       0.62      0.69      0.65      1363
   macro avg       0.31      0.36      0.33      1363
weighted avg       0.60      0.69      0.64      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.565, eval_acc=0.965, eval_loss=5.66, eval_precision=0.524, eval_recall=0.621]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.39      0.77      0.52        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.30      0.50      0.37         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.26      0.40      0.32        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.78      0.77      0.77        90
     PER.NOM       0.63      0.64      0.64       208

   micro avg       0.56      0.63      0.59       389
   macro avg       0.29      0.39      0.33       389
weighted avg       0.58      0.63      0.60       389



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.93it/s, F1=0.767, train_acc=0.981, train_loss=3.27, train_precision=0.755, train_recall=0.797]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.65      0.80      0.72       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.42      0.56      0.48        41
     LOC.NOM       0.60      0.16      0.25        38
     ORG.NAM       0.68      0.80      0.74       141
     ORG.NOM       0.17      0.04      0.06        27
     PER.NAM       0.79      0.80      0.79       432
     PER.NOM       0.77      0.87      0.82       543

   micro avg       0.73      0.79      0.76      1363
   macro avg       0.51      0.50      0.48      1363
weighted avg       0.72      0.79      0.75      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.83it/s, F1=0.624, eval_acc=0.964, eval_loss=5.37, eval_precision=0.551, eval_recall=0.728]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.44      0.73      0.55        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.43      0.50      0.46         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.26      0.45      0.33        47
     ORG.NOM       0.23      0.60      0.33         5
     PER.NAM       0.70      0.79      0.74        90
     PER.NOM       0.70      0.78      0.74       208

   micro avg       0.58      0.72      0.64       389
   macro avg       0.34      0.48      0.39       389
weighted avg       0.61      0.72      0.65       389



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.815, train_acc=0.985, train_loss=2.35, train_precision=0.818, train_recall=0.833]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.75      0.86      0.80       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.57      0.66      0.61        41
     LOC.NOM       0.39      0.29      0.33        38
     ORG.NAM       0.78      0.85      0.82       141
     ORG.NOM       0.42      0.37      0.39        27
     PER.NAM       0.81      0.84      0.83       432
     PER.NOM       0.83      0.90      0.87       543

   micro avg       0.79      0.83      0.81      1363
   macro avg       0.57      0.60      0.58      1363
weighted avg       0.78      0.83      0.81      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.655, eval_acc=0.961, eval_loss=6.39, eval_precision=0.579, eval_recall=0.758]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.69      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      0.83      0.40         6
     LOC.NOM       0.50      0.17      0.25         6
     ORG.NAM       0.31      0.51      0.38        47
     ORG.NOM       0.25      0.60      0.35         5
     PER.NAM       0.64      0.83      0.72        90
     PER.NOM       0.71      0.81      0.75       208

   micro avg       0.59      0.76      0.66       389
   macro avg       0.41      0.56      0.44       389
weighted avg       0.62      0.76      0.67       389



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.27it/s, F1=0.87, train_acc=0.991, train_loss=1.54, train_precision=0.86, train_recall=0.889]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.85      0.91      0.88       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.69      0.83      0.76        41
     LOC.NOM       0.44      0.39      0.42        38
     ORG.NAM       0.81      0.90      0.86       141
     ORG.NOM       0.33      0.44      0.38        27
     PER.NAM       0.91      0.92      0.91       432
     PER.NOM       0.89      0.93      0.91       543

   micro avg       0.85      0.89      0.87      1363
   macro avg       0.62      0.67      0.64      1363
weighted avg       0.85      0.89      0.87      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.675, eval_acc=0.966, eval_loss=6.56, eval_precision=0.632, eval_recall=0.729]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.92      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.34      0.40      0.37        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.74      0.71      0.72        90
     PER.NOM       0.75      0.78      0.77       208

   micro avg       0.65      0.72      0.68       389
   macro avg       0.39      0.56      0.44       389
weighted avg       0.66      0.72      0.68       389



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.15it/s, F1=0.9, train_acc=0.993, train_loss=1.22, train_precision=0.891, train_recall=0.916]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.94      0.96      0.95       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.79      0.93      0.85        41
     LOC.NOM       0.67      0.63      0.65        38
     ORG.NAM       0.84      0.91      0.87       141
     ORG.NOM       0.59      0.63      0.61        27
     PER.NAM       0.91      0.94      0.93       432
     PER.NOM       0.90      0.94      0.92       543

   micro avg       0.89      0.92      0.90      1363
   macro avg       0.71      0.74      0.72      1363
weighted avg       0.88      0.92      0.90      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.652, eval_acc=0.963, eval_loss=6.97, eval_precision=0.577, eval_recall=0.751]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.88      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.30      0.45      0.36        47
     ORG.NOM       0.24      1.00      0.38         5
     PER.NAM       0.76      0.78      0.77        90
     PER.NOM       0.71      0.83      0.76       208

   micro avg       0.59      0.75      0.66       389
   macro avg       0.33      0.49      0.38       389
weighted avg       0.64      0.75      0.68       389



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.96it/s, F1=0.921, train_acc=0.994, train_loss=0.973, train_precision=0.913, train_recall=0.935]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.96      0.96       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.81      0.85      0.83        41
     LOC.NOM       0.76      0.82      0.78        38
     ORG.NAM       0.93      0.97      0.95       141
     ORG.NOM       0.68      0.70      0.69        27
     PER.NAM       0.92      0.93      0.93       432
     PER.NOM       0.92      0.96      0.94       543

   micro avg       0.91      0.94      0.92      1363
   macro avg       0.75      0.77      0.76      1363
weighted avg       0.91      0.94      0.92      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.665, eval_acc=0.961, eval_loss=7.43, eval_precision=0.596, eval_recall=0.757]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.88      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.19      0.67      0.30         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.37      0.45      0.40        47
     ORG.NOM       0.20      0.80      0.32         5
     PER.NAM       0.66      0.80      0.72        90
     PER.NOM       0.75      0.81      0.78       208

   micro avg       0.62      0.75      0.68       389
   macro avg       0.36      0.57      0.42       389
weighted avg       0.65      0.75      0.69       389



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.29it/s, F1=0.943, train_acc=0.996, train_loss=0.687, train_precision=0.938, train_recall=0.953]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.96      0.95       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.86      0.93      0.89        41
     LOC.NOM       0.84      0.82      0.83        38
     ORG.NAM       0.94      0.97      0.95       141
     ORG.NOM       0.93      0.93      0.93        27
     PER.NAM       0.95      0.96      0.95       432
     PER.NOM       0.94      0.97      0.95       543

   micro avg       0.93      0.96      0.94      1363
   macro avg       0.80      0.82      0.81      1363
weighted avg       0.93      0.96      0.94      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.661, eval_acc=0.961, eval_loss=7.91, eval_precision=0.614, eval_recall=0.72] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.85      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.28      0.32      0.30        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.63      0.79      0.70        90
     PER.NOM       0.75      0.76      0.76       208

   micro avg       0.62      0.71      0.66       389
   macro avg       0.40      0.59      0.47       389
weighted avg       0.63      0.71      0.67       389



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.19it/s, F1=0.946, train_acc=0.995, train_loss=0.758, train_precision=0.94, train_recall=0.958] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.98      0.97       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.97      0.93      0.95        41
     LOC.NOM       0.95      0.95      0.95        38
     ORG.NAM       0.92      0.94      0.93       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.93      0.95      0.94       432
     PER.NOM       0.94      0.97      0.96       543

   micro avg       0.94      0.96      0.95      1363
   macro avg       0.83      0.83      0.83      1363
weighted avg       0.94      0.96      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.37it/s, F1=0.692, eval_acc=0.968, eval_loss=8.44, eval_precision=0.665, eval_recall=0.726]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.88      0.65        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.83      0.50         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.39      0.30      0.34        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.85      0.73      0.79        90
     PER.NOM       0.75      0.80      0.77       208

   micro avg       0.69      0.71      0.70       389
   macro avg       0.43      0.54      0.46       389
weighted avg       0.69      0.71      0.69       389



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.92it/s, F1=0.951, train_acc=0.996, train_loss=0.585, train_precision=0.945, train_recall=0.96] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.97      0.96       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.88      0.93      0.90        41
     LOC.NOM       0.95      0.95      0.95        38
     ORG.NAM       0.97      0.96      0.97       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.95      0.96      0.96       432
     PER.NOM       0.94      0.97      0.96       543

   micro avg       0.94      0.96      0.95      1363
   macro avg       0.82      0.84      0.83      1363
weighted avg       0.94      0.96      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.669, eval_acc=0.965, eval_loss=8.32, eval_precision=0.639, eval_recall=0.708]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.88      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.83      0.38         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.38      0.36      0.37        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.81      0.72      0.76        90
     PER.NOM       0.75      0.75      0.75       208

   micro avg       0.65      0.69      0.67       389
   macro avg       0.38      0.54      0.42       389
weighted avg       0.68      0.69      0.68       389



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.27it/s, F1=0.952, train_acc=0.997, train_loss=0.504, train_precision=0.947, train_recall=0.96] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.97      0.97       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.93      0.98      0.95        41
     LOC.NOM       0.95      0.97      0.96        38
     ORG.NAM       0.96      0.97      0.96       141
     ORG.NOM       0.93      0.93      0.93        27
     PER.NAM       0.96      0.96      0.96       432
     PER.NOM       0.94      0.96      0.95       543

   micro avg       0.95      0.96      0.95      1363
   macro avg       0.83      0.84      0.84      1363
weighted avg       0.95      0.96      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.699, eval_acc=0.968, eval_loss=8.91, eval_precision=0.676, eval_recall=0.727]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.85      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.30      0.50      0.37         6
     ORG.NAM       0.37      0.30      0.33        47
     ORG.NOM       0.20      0.60      0.30         5
     PER.NAM       0.84      0.76      0.80        90
     PER.NOM       0.80      0.79      0.80       208

   micro avg       0.70      0.72      0.71       389
   macro avg       0.44      0.58      0.48       389
weighted avg       0.72      0.72      0.71       389



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.30it/s, F1=0.97, train_acc=0.997, train_loss=0.38, train_precision=0.966, train_recall=0.977]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       137
     GPE.NOM       0.50      0.50      0.50         4
     LOC.NAM       0.93      0.93      0.93        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.99      1.00      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.96      0.97      0.97       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.96      0.97      0.97      1363
   macro avg       0.91      0.91      0.91      1363
weighted avg       0.96      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.06it/s, F1=0.692, eval_acc=0.966, eval_loss=8.65, eval_precision=0.649, eval_recall=0.744]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.30      0.50      0.37         6
     ORG.NAM       0.43      0.43      0.43        47
     ORG.NOM       0.17      0.60      0.26         5
     PER.NAM       0.74      0.78      0.76        90
     PER.NOM       0.77      0.79      0.78       208

   micro avg       0.67      0.74      0.70       389
   macro avg       0.42      0.60      0.47       389
weighted avg       0.69      0.74      0.71       389



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.98it/s, F1=0.977, train_acc=0.998, train_loss=0.337, train_precision=0.972, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       0.80      1.00      0.89         4
     LOC.NAM       0.91      0.95      0.93        41
     LOC.NOM       0.95      1.00      0.97        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.97      0.98      0.97       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.95      0.98      0.96      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.69, eval_acc=0.966, eval_loss=8.96, eval_precision=0.66, eval_recall=0.728]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.88      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.25      0.33      0.29         6
     ORG.NAM       0.37      0.34      0.36        47
     ORG.NOM       0.18      0.60      0.27         5
     PER.NAM       0.78      0.78      0.78        90
     PER.NOM       0.78      0.77      0.77       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.43      0.57      0.47       389
weighted avg       0.70      0.72      0.70       389



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.971, train_acc=0.998, train_loss=0.291, train_precision=0.971, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.97      0.95      0.96        41
     LOC.NOM       0.95      0.95      0.95        38
     ORG.NAM       1.00      0.99      1.00       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.98      0.98      0.98       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.691, eval_acc=0.967, eval_loss=9.6, eval_precision=0.663, eval_recall=0.725] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.42      0.40      0.41        47
     ORG.NOM       0.17      0.60      0.26         5
     PER.NAM       0.75      0.74      0.75        90
     PER.NOM       0.78      0.76      0.77       208

   micro avg       0.68      0.71      0.70       389
   macro avg       0.43      0.55      0.47       389
weighted avg       0.70      0.71      0.70       389



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.21it/s, F1=0.964, train_acc=0.997, train_loss=0.35, train_precision=0.959, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.97      0.93      0.95        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.93      0.93      0.93        27
     PER.NAM       0.96      0.97      0.96       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.98      0.97      0.97      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.69, eval_acc=0.967, eval_loss=9.12, eval_precision=0.653, eval_recall=0.737] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.88      0.74        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.15      0.33      0.21         6
     ORG.NAM       0.38      0.40      0.39        47
     ORG.NOM       0.15      0.60      0.24         5
     PER.NAM       0.79      0.81      0.80        90
     PER.NOM       0.78      0.76      0.77       208

   micro avg       0.67      0.73      0.70       389
   macro avg       0.54      0.70      0.59       389
weighted avg       0.70      0.73      0.71       389



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.97, train_acc=0.997, train_loss=0.354, train_precision=0.963, train_recall=0.98]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       0.75      0.75      0.75         4
     LOC.NAM       0.93      0.98      0.95        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.99      1.00      1.00       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.96      0.97      0.96       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.94      0.95      0.94      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.675, eval_acc=0.967, eval_loss=7.66, eval_precision=0.636, eval_recall=0.727]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.32      0.43      0.36        47
     ORG.NOM       0.18      0.60      0.27         5
     PER.NAM       0.78      0.74      0.76        90
     PER.NOM       0.78      0.75      0.76       208

   micro avg       0.66      0.71      0.68       389
   macro avg       0.56      0.70      0.60       389
weighted avg       0.69      0.71      0.70       389



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.97it/s, F1=0.961, train_acc=0.996, train_loss=0.528, train_precision=0.961, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.98      0.95        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.95      0.94      0.95       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.96      0.97      0.96      1363
   macro avg       0.97      0.98      0.98      1363
weighted avg       0.96      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.04it/s, F1=0.663, eval_acc=0.963, eval_loss=9.44, eval_precision=0.606, eval_recall=0.736]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.88      0.74        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.09      0.17      0.12         6
     ORG.NAM       0.35      0.40      0.37        47
     ORG.NOM       0.14      0.60      0.23         5
     PER.NAM       0.67      0.71      0.69        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.62      0.72      0.67       389
   macro avg       0.51      0.67      0.56       389
weighted avg       0.65      0.72      0.68       389



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.29it/s, F1=0.969, train_acc=0.997, train_loss=0.381, train_precision=0.967, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.95      0.95        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.98      0.97      0.98       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.95      0.97      0.96       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.97      0.97      0.97      1363
   macro avg       0.97      0.98      0.97      1363
weighted avg       0.97      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.692, eval_acc=0.965, eval_loss=9.75, eval_precision=0.646, eval_recall=0.749]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.88      0.73        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.22      0.67      0.33         6
     ORG.NAM       0.41      0.36      0.39        47
     ORG.NOM       0.25      0.60      0.35         5
     PER.NAM       0.76      0.82      0.79        90
     PER.NOM       0.74      0.78      0.76       208

   micro avg       0.66      0.75      0.70       389
   macro avg       0.55      0.74      0.61       389
weighted avg       0.68      0.75      0.71       389



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.972, train_acc=0.998, train_loss=0.272, train_precision=0.965, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.95      0.95        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       1.00      0.93      0.96        27
     PER.NAM       0.95      0.97      0.96       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.01it/s, F1=0.685, eval_acc=0.966, eval_loss=9.23, eval_precision=0.669, eval_recall=0.709]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.88      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.45      0.40      0.43        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.78      0.78      0.78        90
     PER.NOM       0.78      0.72      0.75       208

   micro avg       0.69      0.70      0.69       389
   macro avg       0.44      0.57      0.48       389
weighted avg       0.71      0.70      0.70       389



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.95it/s, F1=0.979, train_acc=0.998, train_loss=0.267, train_precision=0.975, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.91      0.95      0.93        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      1.00      1.00       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.97      0.99      0.98      1363
   macro avg       0.97      0.99      0.98      1363
weighted avg       0.97      0.99      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.665, eval_acc=0.963, eval_loss=9.89, eval_precision=0.621, eval_recall=0.719]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.92      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.13      0.33      0.19         6
     ORG.NAM       0.40      0.40      0.40        47
     ORG.NOM       0.14      0.80      0.24         5
     PER.NAM       0.74      0.78      0.76        90
     PER.NOM       0.76      0.73      0.74       208

   micro avg       0.63      0.71      0.67       389
   macro avg       0.53      0.72      0.58       389
weighted avg       0.68      0.71      0.69       389



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.966, train_acc=0.998, train_loss=0.305, train_precision=0.966, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.99      1.00       137
     GPE.NOM       0.80      1.00      0.89         4
     LOC.NAM       0.95      0.93      0.94        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.95      0.97      0.96       141
     ORG.NOM       0.86      0.93      0.89        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.94      0.97      0.95      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.674, eval_acc=0.965, eval_loss=9.36, eval_precision=0.636, eval_recall=0.72] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.92      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.33      0.38      0.36        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.77      0.77      0.77        90
     PER.NOM       0.74      0.74      0.74       208

   micro avg       0.65      0.71      0.68       389
   macro avg       0.45      0.62      0.51       389
weighted avg       0.67      0.71      0.69       389



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.16it/s, F1=0.967, train_acc=0.997, train_loss=0.422, train_precision=0.965, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.95      0.94        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.93      0.96      0.94       141
     ORG.NOM       0.75      0.89      0.81        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.96      0.97      0.97      1363
   macro avg       0.94      0.96      0.95      1363
weighted avg       0.96      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.695, eval_acc=0.967, eval_loss=8.56, eval_precision=0.669, eval_recall=0.728]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.70      0.81      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.39      0.47      0.42        47
     ORG.NOM       0.20      0.40      0.27         5
     PER.NAM       0.79      0.77      0.78        90
     PER.NOM       0.77      0.77      0.77       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.40      0.51      0.44       389
weighted avg       0.70      0.72      0.71       389



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.98it/s, F1=0.959, train_acc=0.998, train_loss=0.257, train_precision=0.957, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      0.93      0.93        41
     LOC.NOM       0.86      0.95      0.90        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.99      0.98      0.98       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.96      0.97      0.96      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.675, eval_acc=0.963, eval_loss=8.95, eval_precision=0.628, eval_recall=0.736]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.43      0.39        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.65      0.84      0.73        90
     PER.NOM       0.77      0.76      0.77       208

   micro avg       0.66      0.73      0.69       389
   macro avg       0.40      0.54      0.45       389
weighted avg       0.66      0.73      0.69       389



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.966, train_acc=0.997, train_loss=0.451, train_precision=0.966, train_recall=0.97] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.86      0.93      0.89        41
     LOC.NOM       0.76      0.76      0.76        38
     ORG.NAM       0.94      0.96      0.95       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.99      0.97      0.98       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.96      0.96      0.96      1363
   macro avg       0.93      0.95      0.94      1363
weighted avg       0.96      0.96      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.699, eval_acc=0.966, eval_loss=9.43, eval_precision=0.659, eval_recall=0.746]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.38      0.43      0.40        47
     ORG.NOM       0.43      0.60      0.50         5
     PER.NAM       0.69      0.83      0.76        90
     PER.NOM       0.78      0.77      0.78       208

   micro avg       0.67      0.74      0.70       389
   macro avg       0.57      0.71      0.62       389
weighted avg       0.69      0.74      0.71       389



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.962, train_acc=0.997, train_loss=0.368, train_precision=0.959, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      0.99      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.80      0.85      0.82        41
     LOC.NOM       0.82      0.87      0.85        38
     ORG.NAM       0.96      0.98      0.97       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.96      0.97      0.97      1363
   macro avg       0.93      0.95      0.94      1363
weighted avg       0.96      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.678, eval_acc=0.963, eval_loss=9.84, eval_precision=0.621, eval_recall=0.751]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.36      0.83      0.50         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.41      0.45      0.43        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.70      0.79      0.74        90
     PER.NOM       0.71      0.79      0.75       208

   micro avg       0.63      0.75      0.68       389
   macro avg       0.53      0.73      0.60       389
weighted avg       0.65      0.75      0.69       389



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.23it/s, F1=0.978, train_acc=0.998, train_loss=0.196, train_precision=0.978, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       1.00      0.95      0.97        41
     LOC.NOM       0.95      0.97      0.96        38
     ORG.NAM       1.00      0.99      1.00       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.98      0.98      0.98       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.99      0.98      0.98      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.08it/s, F1=0.688, eval_acc=0.965, eval_loss=9.88, eval_precision=0.636, eval_recall=0.756]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.35      0.47      0.40        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.74      0.80      0.77        90
     PER.NOM       0.76      0.79      0.78       208

   micro avg       0.65      0.75      0.70       389
   macro avg       0.54      0.73      0.60       389
weighted avg       0.68      0.75      0.71       389



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.97it/s, F1=0.976, train_acc=0.998, train_loss=0.213, train_precision=0.975, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.91      0.95      0.93        41
     LOC.NOM       0.97      0.95      0.96        38
     ORG.NAM       0.99      1.00      1.00       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.99      0.98      0.99       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.68, eval_acc=0.965, eval_loss=9.18, eval_precision=0.645, eval_recall=0.723] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.85      0.76        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.38      0.45      0.41        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.68      0.81      0.74        90
     PER.NOM       0.80      0.76      0.78       208

   micro avg       0.67      0.73      0.70       389
   macro avg       0.45      0.60      0.50       389
weighted avg       0.69      0.73      0.71       389



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.975, train_acc=0.997, train_loss=0.231, train_precision=0.975, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.97      0.95      0.96        41
     LOC.NOM       0.95      1.00      0.97        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.97      0.99      0.98       432
     PER.NOM       0.97      0.96      0.96       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.684, eval_acc=0.966, eval_loss=9.55, eval_precision=0.641, eval_recall=0.739]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.88      0.77        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.45      0.40        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.74      0.79      0.76        90
     PER.NOM       0.76      0.77      0.77       208

   micro avg       0.65      0.73      0.69       389
   macro avg       0.39      0.54      0.44       389
weighted avg       0.67      0.73      0.70       389



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.983, train_acc=0.999, train_loss=0.143, train_precision=0.982, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.98      0.96        41
     LOC.NOM       1.00      0.95      0.97        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.99      1.00      0.99       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.98      0.99      0.99      1363
   macro avg       0.98      0.99      0.99      1363
weighted avg       0.98      0.99      0.99      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.694, eval_acc=0.967, eval_loss=10.6, eval_precision=0.66, eval_recall=0.736] 


eval_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.38      0.45      0.41        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.73      0.79      0.76        90
     PER.NOM       0.80      0.76      0.78       208

   micro avg       0.68      0.73      0.70       389
   macro avg       0.45      0.60      0.50       389
weighted avg       0.70      0.73      0.71       389



calculate data/few_shot/weibo/train_1000.json etag: 100%|██████████| 665k/665k [00:00<00:00, 283MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 194MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 197MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 526kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_1000.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/weibo/test.json",
    "tag_file": "data/few_shot/weibo/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "weibo_pretrain_lebert_crf_1000_x3"
}
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree



count line size data/few_shot/weibo/labels.txt: 29L [00:00, 259903.45L/s]
build line mapper: 29L [00:00, 259903.45L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8667.77it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 256420.33it/s]
load dataset from data/few_shot/weibo/train_1000.json: 55it [00:00, 543.69it/s]

load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/b8906855ab5cdf4bb18730a0e123dcf9_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_1000.json: 1000it [00:01, 505.68it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 501.95it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0, train_acc=0.792, train_loss=43.1, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.00      0.00      0.00       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.00      0.00      0.00       432
     PER.NOM       0.00      0.00      0.00       543

   micro avg       0.00      0.00      0.00      1363
   macro avg       0.00      0.00      0.00      1363
weighted avg       0.00      0.00      0.00      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.0027, eval_acc=0.934, eval_loss=12.3, eval_precision=0.0105, eval_recall=0.00155] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.05      0.01      0.02        90
     PER.NOM       0.00      0.00      0.00       208

   micro avg       0.03      0.00      0.00       389
   macro avg       0.01      0.00      0.00       389
weighted avg       0.01      0.00      0.00       389



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.337, train_acc=0.954, train_loss=9.12, train_precision=0.374, train_recall=0.33]      


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.20      0.15      0.17       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.14      0.06      0.08       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.38      0.41      0.39       432
     PER.NOM       0.43      0.46      0.45       543

   micro avg       0.38      0.34      0.36      1363
   macro avg       0.14      0.14      0.14      1363
weighted avg       0.33      0.34      0.33      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.614, eval_acc=0.96, eval_loss=6.15, eval_precision=0.584, eval_recall=0.653] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.39      0.65      0.49        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.26      0.19      0.22        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.57      0.78      0.66        90
     PER.NOM       0.67      0.76      0.71       208

   micro avg       0.58      0.65      0.61       389
   macro avg       0.24      0.30      0.26       389
weighted avg       0.55      0.65      0.59       389



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.682, train_acc=0.974, train_loss=4.5, train_precision=0.697, train_recall=0.694] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.53      0.73      0.61       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.00      0.00      0.00        41
     LOC.NOM       0.00      0.00      0.00        38
     ORG.NAM       0.63      0.62      0.63       141
     ORG.NOM       0.00      0.00      0.00        27
     PER.NAM       0.77      0.77      0.77       432
     PER.NOM       0.70      0.78      0.74       543

   micro avg       0.66      0.69      0.68      1363
   macro avg       0.33      0.36      0.34      1363
weighted avg       0.64      0.69      0.66      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.40it/s, F1=0.616, eval_acc=0.957, eval_loss=6.27, eval_precision=0.538, eval_recall=0.726]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.36      0.73      0.48        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.23      0.49      0.31        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.62      0.74      0.68        90
     PER.NOM       0.74      0.82      0.78       208

   micro avg       0.54      0.72      0.62       389
   macro avg       0.24      0.35      0.28       389
weighted avg       0.59      0.72      0.64       389



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.21it/s, F1=0.761, train_acc=0.983, train_loss=2.94, train_precision=0.751, train_recall=0.791]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.67      0.82      0.74       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.21      0.32      0.25        41
     LOC.NOM       0.11      0.05      0.07        38
     ORG.NAM       0.71      0.82      0.76       141
     ORG.NOM       0.11      0.04      0.06        27
     PER.NAM       0.84      0.84      0.84       432
     PER.NOM       0.81      0.88      0.84       543

   micro avg       0.75      0.80      0.77      1363
   macro avg       0.43      0.47      0.45      1363
weighted avg       0.74      0.80      0.77      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.15it/s, F1=0.648, eval_acc=0.963, eval_loss=5.73, eval_precision=0.587, eval_recall=0.727]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.52      0.88      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.37      0.53      0.44        47
     ORG.NOM       0.40      0.40      0.40         5
     PER.NAM       0.69      0.74      0.72        90
     PER.NOM       0.69      0.76      0.72       208

   micro avg       0.60      0.71      0.65       389
   macro avg       0.36      0.46      0.40       389
weighted avg       0.61      0.71      0.66       389



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.28it/s, F1=0.845, train_acc=0.988, train_loss=1.9, train_precision=0.839, train_recall=0.864] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.80      0.91      0.85       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.47      0.61      0.53        41
     LOC.NOM       0.29      0.29      0.29        38
     ORG.NAM       0.87      0.91      0.89       141
     ORG.NOM       0.52      0.44      0.48        27
     PER.NAM       0.88      0.87      0.88       432
     PER.NOM       0.88      0.92      0.90       543

   micro avg       0.83      0.87      0.85      1363
   macro avg       0.59      0.62      0.60      1363
weighted avg       0.83      0.87      0.85      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.671, eval_acc=0.965, eval_loss=6.42, eval_precision=0.622, eval_recall=0.733]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.85      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.08      0.17      0.11         6
     ORG.NAM       0.36      0.43      0.39        47
     ORG.NOM       0.30      0.60      0.40         5
     PER.NAM       0.74      0.78      0.76        90
     PER.NOM       0.75      0.77      0.76       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.39      0.55      0.44       389
weighted avg       0.66      0.72      0.69       389



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.862, train_acc=0.99, train_loss=1.55, train_precision=0.856, train_recall=0.88]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.90      0.96      0.93       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.63      0.71      0.67        41
     LOC.NOM       0.41      0.42      0.42        38
     ORG.NAM       0.87      0.93      0.90       141
     ORG.NOM       0.55      0.59      0.57        27
     PER.NAM       0.87      0.89      0.88       432
     PER.NOM       0.90      0.92      0.91       543

   micro avg       0.86      0.89      0.87      1363
   macro avg       0.64      0.68      0.66      1363
weighted avg       0.86      0.89      0.87      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.663, eval_acc=0.965, eval_loss=6.41, eval_precision=0.639, eval_recall=0.692]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.81      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.26      0.83      0.40         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.39      0.40      0.40        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.73      0.77      0.75        90
     PER.NOM       0.77      0.72      0.74       208

   micro avg       0.65      0.69      0.67       389
   macro avg       0.43      0.58      0.48       389
weighted avg       0.68      0.69      0.68       389



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.19it/s, F1=0.922, train_acc=0.994, train_loss=1.05, train_precision=0.918, train_recall=0.932] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.95      0.94       137
     GPE.NOM       0.00      0.00      0.00         4
     LOC.NAM       0.69      0.80      0.74        41
     LOC.NOM       0.62      0.68      0.65        38
     ORG.NAM       0.95      0.98      0.96       141
     ORG.NOM       0.80      0.74      0.77        27
     PER.NAM       0.92      0.92      0.92       432
     PER.NOM       0.92      0.95      0.93       543

   micro avg       0.91      0.92      0.92      1363
   macro avg       0.73      0.75      0.74      1363
weighted avg       0.90      0.92      0.91      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.90it/s, F1=0.657, eval_acc=0.966, eval_loss=6.44, eval_precision=0.614, eval_recall=0.71] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.73      0.60        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.67      0.57         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.38      0.51      0.44        47
     ORG.NOM       0.25      1.00      0.40         5
     PER.NAM       0.78      0.66      0.71        90
     PER.NOM       0.72      0.77      0.75       208

   micro avg       0.63      0.70      0.66       389
   macro avg       0.39      0.54      0.43       389
weighted avg       0.66      0.70      0.67       389



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:41<00:00,  3.00it/s, F1=0.935, train_acc=0.995, train_loss=0.864, train_precision=0.932, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.96      0.96       137
     GPE.NOM       0.50      0.25      0.33         4
     LOC.NAM       0.85      0.95      0.90        41
     LOC.NOM       0.65      0.68      0.67        38
     ORG.NAM       0.92      0.96      0.94       141
     ORG.NOM       0.82      0.85      0.84        27
     PER.NAM       0.94      0.95      0.95       432
     PER.NOM       0.94      0.96      0.95       543

   micro avg       0.93      0.94      0.93      1363
   macro avg       0.82      0.82      0.82      1363
weighted avg       0.93      0.94      0.93      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.666, eval_acc=0.961, eval_loss=7.39, eval_precision=0.601, eval_recall=0.749]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.34      0.45      0.39        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.65      0.81      0.72        90
     PER.NOM       0.71      0.79      0.75       208

   micro avg       0.62      0.75      0.68       389
   macro avg       0.39      0.57      0.45       389
weighted avg       0.62      0.75      0.68       389



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.18it/s, F1=0.935, train_acc=0.995, train_loss=0.785, train_precision=0.928, train_recall=0.948]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.93      0.94      0.93       137
     GPE.NOM       0.50      0.25      0.33         4
     LOC.NAM       0.89      0.95      0.92        41
     LOC.NOM       0.84      0.82      0.83        38
     ORG.NAM       0.91      0.95      0.93       141
     ORG.NOM       0.89      0.89      0.89        27
     PER.NAM       0.92      0.95      0.94       432
     PER.NOM       0.94      0.97      0.95       543

   micro avg       0.92      0.95      0.94      1363
   macro avg       0.85      0.84      0.84      1363
weighted avg       0.92      0.95      0.94      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.10it/s, F1=0.664, eval_acc=0.963, eval_loss=6.83, eval_precision=0.613, eval_recall=0.727]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.52      0.85      0.65        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.09      0.17      0.12         6
     ORG.NAM       0.35      0.43      0.38        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.74      0.72      0.73        90
     PER.NOM       0.74      0.78      0.76       208

   micro avg       0.62      0.72      0.67       389
   macro avg       0.38      0.57      0.44       389
weighted avg       0.65      0.72      0.68       389



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0.939, train_acc=0.996, train_loss=0.598, train_precision=0.931, train_recall=0.951]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.98      0.97       137
     GPE.NOM       1.00      0.75      0.86         4
     LOC.NAM       0.93      0.90      0.91        41
     LOC.NOM       0.93      0.97      0.95        38
     ORG.NAM       0.94      0.97      0.95       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.93      0.96      0.95       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.94      0.97      0.95      1363
   macro avg       0.95      0.93      0.94      1363
weighted avg       0.94      0.97      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.673, eval_acc=0.965, eval_loss=8.36, eval_precision=0.636, eval_recall=0.719]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.92      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.27      0.67      0.38         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.33      0.38      0.35        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.76      0.70      0.73        90
     PER.NOM       0.76      0.78      0.77       208

   micro avg       0.65      0.71      0.68       389
   macro avg       0.41      0.55      0.46       389
weighted avg       0.67      0.71      0.69       389



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0.954, train_acc=0.996, train_loss=0.612, train_precision=0.946, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.86      0.93      0.89        41
     LOC.NOM       0.85      0.92      0.89        38
     ORG.NAM       0.92      0.93      0.93       141
     ORG.NOM       0.93      1.00      0.96        27
     PER.NAM       0.96      0.98      0.97       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.95      0.97      0.96      1363
   macro avg       0.93      0.96      0.95      1363
weighted avg       0.95      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.38it/s, F1=0.658, eval_acc=0.958, eval_loss=7.4, eval_precision=0.58, eval_recall=0.763]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.88      0.68        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.33      0.47      0.39        47
     ORG.NOM       0.19      0.60      0.29         5
     PER.NAM       0.66      0.79      0.72        90
     PER.NOM       0.70      0.82      0.76       208

   micro avg       0.59      0.76      0.67       389
   macro avg       0.42      0.69      0.51       389
weighted avg       0.62      0.76      0.68       389



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:43<00:00,  2.90it/s, F1=0.957, train_acc=0.996, train_loss=0.508, train_precision=0.951, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.99      0.97       137
     GPE.NOM       0.80      1.00      0.89         4
     LOC.NAM       0.87      0.98      0.92        41
     LOC.NOM       0.94      0.89      0.92        38
     ORG.NAM       0.98      0.99      0.98       141
     ORG.NOM       0.86      0.93      0.89        27
     PER.NAM       0.95      0.96      0.95       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.95      0.97      0.96      1363
   macro avg       0.91      0.96      0.94      1363
weighted avg       0.95      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.27it/s, F1=0.683, eval_acc=0.966, eval_loss=8.02, eval_precision=0.65, eval_recall=0.724] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.81      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.44      0.67      0.53         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.43      0.40      0.42        47
     ORG.NOM       0.50      0.80      0.62         5
     PER.NAM       0.73      0.68      0.70        90
     PER.NOM       0.72      0.81      0.76       208

   micro avg       0.67      0.71      0.69       389
   macro avg       0.44      0.52      0.47       389
weighted avg       0.66      0.71      0.69       389



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.956, train_acc=0.997, train_loss=0.448, train_precision=0.951, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.90      0.93      0.92        41
     LOC.NOM       0.93      0.97      0.95        38
     ORG.NAM       0.97      0.99      0.98       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.96      0.97      0.97       432
     PER.NOM       0.94      0.97      0.95       543

   micro avg       0.95      0.97      0.96      1363
   macro avg       0.96      0.97      0.97      1363
weighted avg       0.95      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.685, eval_acc=0.966, eval_loss=7.4, eval_precision=0.656, eval_recall=0.72]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.67      0.42         6
     LOC.NOM       0.25      0.17      0.20         6
     ORG.NAM       0.41      0.43      0.42        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.74      0.79      0.76        90
     PER.NOM       0.78      0.75      0.77       208

   micro avg       0.68      0.71      0.70       389
   macro avg       0.43      0.56      0.47       389
weighted avg       0.69      0.71      0.70       389



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.971, train_acc=0.998, train_loss=0.352, train_precision=0.969, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.90      0.93      0.92        41
     LOC.NOM       0.95      0.95      0.95        38
     ORG.NAM       0.97      0.99      0.98       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.97      0.98      0.97       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.96      0.97      0.97      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.695, eval_acc=0.966, eval_loss=8.13, eval_precision=0.647, eval_recall=0.756]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.88      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.41      0.36      0.39        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.72      0.79      0.76        90
     PER.NOM       0.75      0.83      0.79       208

   micro avg       0.67      0.76      0.71       389
   macro avg       0.44      0.58      0.49       389
weighted avg       0.67      0.76      0.71       389



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.97it/s, F1=0.969, train_acc=0.998, train_loss=0.324, train_precision=0.965, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.87      0.95      0.91        41
     LOC.NOM       1.00      1.00      1.00        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.96      0.98      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.97      0.98      0.98      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.691, eval_acc=0.967, eval_loss=8.71, eval_precision=0.651, eval_recall=0.739]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.34      0.40      0.37        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.75      0.71      0.73        90
     PER.NOM       0.77      0.82      0.79       208

   micro avg       0.67      0.73      0.70       389
   macro avg       0.43      0.57      0.48       389
weighted avg       0.68      0.73      0.70       389



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.27it/s, F1=0.973, train_acc=0.997, train_loss=0.324, train_precision=0.972, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.90      0.93      0.92        41
     LOC.NOM       1.00      0.95      0.97        38
     ORG.NAM       0.96      0.96      0.96       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.96      0.98      0.97       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.98      0.97      0.97      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.45it/s, F1=0.685, eval_acc=0.965, eval_loss=8.1, eval_precision=0.646, eval_recall=0.732] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.40      0.67      0.50         6
     LOC.NOM       0.12      0.50      0.19         6
     ORG.NAM       0.42      0.34      0.38        47
     ORG.NOM       0.67      0.80      0.73         5
     PER.NAM       0.71      0.78      0.74        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.66      0.72      0.69       389
   macro avg       0.46      0.59      0.50       389
weighted avg       0.69      0.72      0.70       389



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.20it/s, F1=0.953, train_acc=0.998, train_loss=0.296, train_precision=0.953, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.84      0.93      0.88        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.95      0.98      0.97       141
     ORG.NOM       0.92      0.85      0.88        27
     PER.NAM       0.98      0.97      0.98       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.95      0.96      0.96      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.683, eval_acc=0.965, eval_loss=8.35, eval_precision=0.631, eval_recall=0.75] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.50      0.85      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.83      0.50         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.42      0.47      0.44        47
     ORG.NOM       0.26      1.00      0.42         5
     PER.NAM       0.69      0.78      0.73        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.65      0.74      0.69       389
   macro avg       0.41      0.63      0.48       389
weighted avg       0.67      0.74      0.70       389



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.99it/s, F1=0.967, train_acc=0.998, train_loss=0.242, train_precision=0.966, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.95      0.93      0.94        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.97      0.99      0.98       432
     PER.NOM       0.96      0.97      0.96       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.43it/s, F1=0.682, eval_acc=0.965, eval_loss=8.98, eval_precision=0.647, eval_recall=0.726]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.88      0.74        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.37      0.49      0.42        47
     ORG.NOM       0.20      0.60      0.30         5
     PER.NAM       0.79      0.70      0.74        90
     PER.NOM       0.80      0.77      0.79       208

   micro avg       0.67      0.72      0.69       389
   macro avg       0.40      0.56      0.45       389
weighted avg       0.71      0.72      0.71       389



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.969, train_acc=0.998, train_loss=0.281, train_precision=0.965, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.86      0.93      0.89        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.98      0.99      0.98       432
     PER.NOM       0.95      0.97      0.96       543

   micro avg       0.97      0.98      0.97      1363
   macro avg       0.96      0.98      0.97      1363
weighted avg       0.97      0.98      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.44it/s, F1=0.655, eval_acc=0.96, eval_loss=9.45, eval_precision=0.595, eval_recall=0.732] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.53      0.88      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.67      0.44         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.34      0.47      0.39        47
     ORG.NOM       0.23      0.60      0.33         5
     PER.NAM       0.70      0.78      0.74        90
     PER.NOM       0.72      0.76      0.74       208

   micro avg       0.61      0.73      0.67       389
   macro avg       0.40      0.58      0.46       389
weighted avg       0.63      0.73      0.68       389



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.973, train_acc=0.998, train_loss=0.24, train_precision=0.971, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.84      0.93      0.88        41
     LOC.NOM       0.97      1.00      0.99        38
     ORG.NAM       0.97      0.99      0.98       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.98      0.99      0.98       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.97      0.98      0.97      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.687, eval_acc=0.966, eval_loss=9.25, eval_precision=0.662, eval_recall=0.716]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.85      0.64        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.50      0.50      0.50         6
     ORG.NAM       0.41      0.28      0.33        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.76      0.72      0.74        90
     PER.NOM       0.73      0.78      0.76       208

   micro avg       0.67      0.70      0.69       389
   macro avg       0.48      0.59      0.51       389
weighted avg       0.67      0.70      0.68       389



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.29it/s, F1=0.968, train_acc=0.998, train_loss=0.284, train_precision=0.967, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.93      1.00      0.96        41
     LOC.NOM       0.97      0.95      0.96        38
     ORG.NAM       0.98      0.98      0.98       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.98      0.98      0.98       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.695, eval_acc=0.966, eval_loss=8.4, eval_precision=0.672, eval_recall=0.723] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.25      0.50      0.33         6
     ORG.NAM       0.40      0.34      0.37        47
     ORG.NOM       0.27      0.80      0.40         5
     PER.NAM       0.76      0.77      0.76        90
     PER.NOM       0.79      0.76      0.77       208

   micro avg       0.68      0.71      0.70       389
   macro avg       0.44      0.61      0.49       389
weighted avg       0.70      0.71      0.70       389



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:41<00:00,  2.98it/s, F1=0.966, train_acc=0.997, train_loss=0.315, train_precision=0.966, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.88      0.93      0.90        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.97      0.98      0.97       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.97      0.97      0.97       432
     PER.NOM       0.97      0.97      0.97       543

   micro avg       0.97      0.97      0.97      1363
   macro avg       0.97      0.97      0.97      1363
weighted avg       0.97      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.696, eval_acc=0.966, eval_loss=8.89, eval_precision=0.655, eval_recall=0.744]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.88      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.44      0.67      0.53         6
     LOC.NOM       0.23      0.50      0.32         6
     ORG.NAM       0.45      0.45      0.45        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.78      0.73      0.75        90
     PER.NOM       0.76      0.80      0.78       208

   micro avg       0.67      0.74      0.70       389
   macro avg       0.44      0.60      0.49       389
weighted avg       0.69      0.74      0.71       389



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.26it/s, F1=0.972, train_acc=0.998, train_loss=0.212, train_precision=0.976, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.97      0.95      0.96        41
     LOC.NOM       1.00      1.00      1.00        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.89      0.89      0.89        27
     PER.NAM       0.98      0.97      0.98       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.97      0.97      0.97      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.677, eval_acc=0.964, eval_loss=9.09, eval_precision=0.637, eval_recall=0.725]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.38      0.51      0.44        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.75      0.74      0.75        90
     PER.NOM       0.77      0.76      0.77       208

   micro avg       0.66      0.72      0.69       389
   macro avg       0.40      0.56      0.45       389
weighted avg       0.68      0.72      0.70       389



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.979, train_acc=0.998, train_loss=0.293, train_precision=0.977, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      0.75      0.86         4
     LOC.NAM       0.95      0.98      0.96        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.98      0.98      0.98       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.97      0.99      0.98       432
     PER.NOM       0.98      0.98      0.98       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.98      0.95      0.96      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.688, eval_acc=0.967, eval_loss=8.16, eval_precision=0.66, eval_recall=0.723] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.38      0.38      0.38        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.74      0.74      0.74        90
     PER.NOM       0.78      0.79      0.78       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.44      0.57      0.48       389
weighted avg       0.69      0.72      0.70       389



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.95it/s, F1=0.961, train_acc=0.997, train_loss=0.49, train_precision=0.959, train_recall=0.966] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.73      0.78      0.75        41
     LOC.NOM       0.97      0.97      0.97        38
     ORG.NAM       0.98      0.97      0.98       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.95      0.96      0.96       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.96      0.97      0.96      1363
   macro avg       0.95      0.95      0.95      1363
weighted avg       0.96      0.97      0.96      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.673, eval_acc=0.962, eval_loss=8.09, eval_precision=0.609, eval_recall=0.756]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.36      0.67      0.47         6
     LOC.NOM       0.25      0.17      0.20         6
     ORG.NAM       0.34      0.51      0.41        47
     ORG.NOM       0.24      0.80      0.36         5
     PER.NAM       0.67      0.77      0.72        90
     PER.NOM       0.74      0.81      0.78       208

   micro avg       0.63      0.76      0.69       389
   macro avg       0.41      0.58      0.46       389
weighted avg       0.65      0.76      0.70       389



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.977, train_acc=0.997, train_loss=0.329, train_precision=0.977, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.90      0.93      0.92        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.98      0.98      0.98       141
     ORG.NOM       1.00      0.96      0.98        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.97      0.98      0.97       543

   micro avg       0.97      0.98      0.98      1363
   macro avg       0.98      0.98      0.98      1363
weighted avg       0.97      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.39it/s, F1=0.682, eval_acc=0.965, eval_loss=9.65, eval_precision=0.643, eval_recall=0.73] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.36      0.43      0.39        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.69      0.78      0.73        90
     PER.NOM       0.79      0.75      0.77       208

   micro avg       0.66      0.72      0.69       389
   macro avg       0.45      0.60      0.50       389
weighted avg       0.68      0.72      0.70       389



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.18it/s, F1=0.974, train_acc=0.998, train_loss=0.213, train_precision=0.973, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.88      0.93      0.90        41
     LOC.NOM       0.90      0.95      0.92        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       0.96      1.00      0.98        27
     PER.NAM       0.98      0.98      0.98       432
     PER.NOM       0.98      0.97      0.98       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.96      0.98      0.97      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.68, eval_acc=0.964, eval_loss=9.77, eval_precision=0.631, eval_recall=0.741] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.33      0.33      0.33         6
     ORG.NAM       0.33      0.53      0.41        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.74      0.73      0.74        90
     PER.NOM       0.78      0.77      0.78       208

   micro avg       0.65      0.73      0.69       389
   macro avg       0.45      0.61      0.51       389
weighted avg       0.69      0.73      0.70       389



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:42<00:00,  2.94it/s, F1=0.966, train_acc=0.997, train_loss=0.424, train_precision=0.963, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.91      0.95      0.93        41
     LOC.NOM       0.95      0.97      0.96        38
     ORG.NAM       0.97      0.99      0.98       141
     ORG.NOM       0.93      0.96      0.95        27
     PER.NAM       0.97      0.96      0.97       432
     PER.NOM       0.96      0.97      0.97       543

   micro avg       0.97      0.97      0.97      1363
   macro avg       0.96      0.98      0.97      1363
weighted avg       0.97      0.97      0.97      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.673, eval_acc=0.965, eval_loss=8.59, eval_precision=0.642, eval_recall=0.713]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.39      0.45      0.42        47
     ORG.NOM       0.27      0.80      0.40         5
     PER.NAM       0.76      0.66      0.70        90
     PER.NOM       0.77      0.78      0.77       208

   micro avg       0.67      0.70      0.68       389
   macro avg       0.43      0.56      0.47       389
weighted avg       0.69      0.70      0.69       389



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.944, train_acc=0.996, train_loss=0.564, train_precision=0.943, train_recall=0.95] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.86      0.93      0.89        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.98      0.99      0.99       141
     ORG.NOM       0.96      0.96      0.96        27
     PER.NAM       0.90      0.92      0.91       432
     PER.NOM       0.96      0.96      0.96       543

   micro avg       0.94      0.96      0.95      1363
   macro avg       0.96      0.97      0.96      1363
weighted avg       0.94      0.96      0.95      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.696, eval_acc=0.966, eval_loss=8.61, eval_precision=0.662, eval_recall=0.74] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.70      0.81      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.36      0.45      0.40        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.75      0.76      0.75        90
     PER.NOM       0.79      0.79      0.79       208

   micro avg       0.69      0.74      0.71       389
   macro avg       0.49      0.60      0.52       389
weighted avg       0.71      0.74      0.72       389



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.28it/s, F1=0.97, train_acc=0.998, train_loss=0.178, train_precision=0.966, train_recall=0.976] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       137
     GPE.NOM       1.00      1.00      1.00         4
     LOC.NAM       0.97      0.93      0.95        41
     LOC.NOM       1.00      0.97      0.99        38
     ORG.NAM       0.99      0.99      0.99       141
     ORG.NOM       1.00      1.00      1.00        27
     PER.NAM       0.97      0.98      0.98       432
     PER.NOM       0.97      0.98      0.98       543

   micro avg       0.98      0.98      0.98      1363
   macro avg       0.99      0.98      0.99      1363
weighted avg       0.98      0.98      0.98      1363



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.88it/s, F1=0.699, eval_acc=0.967, eval_loss=9.77, eval_precision=0.676, eval_recall=0.728]


eval_reports:


calculate data/few_shot/weibo/train_1350.json etag:   0%|          | 0.00/911k [00:00<?, ?B/s]

              precision    recall  f1-score   support

     GPE.NAM       0.70      0.81      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.29      0.33      0.31         6
     ORG.NAM       0.38      0.45      0.41        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.76      0.76      0.76        90
     PER.NOM       0.82      0.77      0.79       208

   micro avg       0.70      0.72      0.71       389
   macro avg       0.46      0.59      0.51       389
weighted avg       0.72      0.72      0.72       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_1350.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/

calculate data/few_shot/weibo/train_1350.json etag: 100%|██████████| 911k/911k [00:00<00:00, 23.0MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 178MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 185MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 464kB/s]


load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 219954.46L/s]
build line mapper: 29L [00:00, 232127.51L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 7657.21it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 265102.74it/s]

load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding



load dataset from data/few_shot/weibo/train_1350.json: 1350it [00:02, 495.90it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 504.14it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mod

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.03it/s, F1=3.92e-5, train_acc=0.81, train_loss=55, train_precision=2.03e-5, train_recall=0.000538]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.00      0.00      0.00        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.00      0.00      0.00       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.00      0.00      0.00       577
     PER.NOM       0.00      0.00      0.00       769

   micro avg       0.00      0.00      0.00      1889
   macro avg       0.00      0.00      0.00      1889
weighted avg       0.00      0.00      0.00      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.23it/s, F1=0.00281, eval_acc=0.941, eval_loss=12.3, eval_precision=0.00256, eval_recall=0.0031] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.01      0.01      0.01       208

   micro avg       0.00      0.01      0.00       389
   macro avg       0.00      0.00      0.00       389
weighted avg       0.00      0.01      0.00       389



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.384, train_acc=0.959, train_loss=9.23, train_precision=0.356, train_recall=0.446]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.32      0.47      0.38       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.00      0.00      0.00        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.08      0.10      0.09       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.29      0.41      0.34       577
     PER.NOM       0.41      0.59      0.49       769

   micro avg       0.32      0.43      0.37      1889
   macro avg       0.14      0.20      0.16      1889
weighted avg       0.30      0.43      0.35      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.605, eval_acc=0.966, eval_loss=6.37, eval_precision=0.545, eval_recall=0.684]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.77      0.62        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.25      0.33      0.29         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.11      0.15      0.13        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.57      0.72      0.64        90
     PER.NOM       0.65      0.80      0.72       208

   micro avg       0.54      0.67      0.60       389
   macro avg       0.26      0.35      0.30       389
weighted avg       0.53      0.67      0.59       389



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.652, train_acc=0.976, train_loss=4.57, train_precision=0.62, train_recall=0.706] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.59      0.79      0.68       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.25      0.32      0.28        56
     LOC.NOM       0.07      0.04      0.05        51
     ORG.NAM       0.35      0.56      0.43       182
     ORG.NOM       0.07      0.02      0.04        42
     PER.NAM       0.63      0.71      0.67       577
     PER.NOM       0.71      0.83      0.77       769

   micro avg       0.60      0.70      0.65      1889
   macro avg       0.33      0.41      0.36      1889
weighted avg       0.59      0.70      0.64      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.591, eval_acc=0.966, eval_loss=6.34, eval_precision=0.508, eval_recall=0.721]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.45      0.69      0.55        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.17      0.50      0.25         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.22      0.38      0.28        47
     ORG.NOM       0.38      0.60      0.46         5
     PER.NAM       0.63      0.81      0.71        90
     PER.NOM       0.68      0.78      0.72       208

   micro avg       0.54      0.71      0.62       389
   macro avg       0.33      0.49      0.39       389
weighted avg       0.57      0.71      0.63       389



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.04it/s, F1=0.753, train_acc=0.983, train_loss=3.19, train_precision=0.724, train_recall=0.802]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.67      0.82      0.74       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.41      0.55      0.47        56
     LOC.NOM       0.16      0.20      0.18        51
     ORG.NAM       0.59      0.75      0.66       182
     ORG.NOM       0.50      0.48      0.49        42
     PER.NAM       0.77      0.81      0.79       577
     PER.NOM       0.80      0.89      0.84       769

   micro avg       0.71      0.80      0.76      1889
   macro avg       0.49      0.56      0.52      1889
weighted avg       0.72      0.80      0.76      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.631, eval_acc=0.966, eval_loss=6.3, eval_precision=0.553, eval_recall=0.74]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.47      0.73      0.58        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.31      0.67      0.42         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.27      0.47      0.34        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.66      0.79      0.72        90
     PER.NOM       0.68      0.80      0.74       208

   micro avg       0.57      0.74      0.64       389
   macro avg       0.37      0.53      0.43       389
weighted avg       0.60      0.74      0.66       389



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.822, train_acc=0.988, train_loss=2.26, train_precision=0.802, train_recall=0.856]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.81      0.87      0.84       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.63      0.70      0.66        56
     LOC.NOM       0.24      0.31      0.27        51
     ORG.NAM       0.73      0.87      0.79       182
     ORG.NOM       0.48      0.57      0.52        42
     PER.NAM       0.82      0.86      0.84       577
     PER.NOM       0.85      0.91      0.88       769

   micro avg       0.79      0.85      0.82      1889
   macro avg       0.57      0.64      0.60      1889
weighted avg       0.79      0.85      0.82      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.00it/s, F1=0.644, eval_acc=0.965, eval_loss=7.49, eval_precision=0.571, eval_recall=0.743]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.44      0.85      0.58        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.22      0.67      0.33         6
     LOC.NOM       0.08      0.33      0.13         6
     ORG.NAM       0.30      0.26      0.28        47
     ORG.NOM       0.38      1.00      0.56         5
     PER.NAM       0.72      0.79      0.75        90
     PER.NOM       0.70      0.83      0.76       208

   micro avg       0.59      0.74      0.65       389
   macro avg       0.36      0.59      0.42       389
weighted avg       0.62      0.74      0.67       389



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.05it/s, F1=0.863, train_acc=0.991, train_loss=1.65, train_precision=0.843, train_recall=0.893]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.88      0.92      0.90       204
     GPE.NOM       0.50      0.38      0.43         8
     LOC.NAM       0.69      0.82      0.75        56
     LOC.NOM       0.43      0.53      0.47        51
     ORG.NAM       0.83      0.90      0.86       182
     ORG.NOM       0.64      0.69      0.67        42
     PER.NAM       0.88      0.89      0.89       577
     PER.NOM       0.88      0.94      0.91       769

   micro avg       0.85      0.90      0.87      1889
   macro avg       0.72      0.76      0.73      1889
weighted avg       0.85      0.90      0.87      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.645, eval_acc=0.965, eval_loss=7.19, eval_precision=0.573, eval_recall=0.744]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.48      0.85      0.61        26
     GPE.NOM       0.25      1.00      0.40         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.38      0.37        47
     ORG.NOM       0.16      0.60      0.25         5
     PER.NAM       0.61      0.79      0.69        90
     PER.NOM       0.71      0.79      0.75       208

   micro avg       0.59      0.72      0.65       389
   macro avg       0.32      0.55      0.38       389
weighted avg       0.60      0.72      0.65       389



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.89, train_acc=0.992, train_loss=1.34, train_precision=0.871, train_recall=0.918] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.85      0.91      0.88       204
     GPE.NOM       0.56      0.62      0.59         8
     LOC.NAM       0.69      0.77      0.73        56
     LOC.NOM       0.70      0.73      0.71        51
     ORG.NAM       0.86      0.93      0.90       182
     ORG.NOM       0.70      0.74      0.72        42
     PER.NAM       0.87      0.91      0.89       577
     PER.NOM       0.91      0.96      0.94       769

   micro avg       0.87      0.92      0.89      1889
   macro avg       0.77      0.82      0.79      1889
weighted avg       0.87      0.92      0.89      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.17it/s, F1=0.668, eval_acc=0.967, eval_loss=6.91, eval_precision=0.592, eval_recall=0.77] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.53      0.73      0.61        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.57      0.67      0.62         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.51      0.42        47
     ORG.NOM       0.25      0.80      0.38         5
     PER.NAM       0.66      0.77      0.71        90
     PER.NOM       0.73      0.83      0.77       208

   micro avg       0.61      0.75      0.67       389
   macro avg       0.51      0.66      0.56       389
weighted avg       0.63      0.75      0.69       389



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.928, train_acc=0.995, train_loss=0.972, train_precision=0.915, train_recall=0.946]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.96      0.95       204
     GPE.NOM       0.56      0.62      0.59         8
     LOC.NAM       0.85      0.91      0.88        56
     LOC.NOM       0.80      0.86      0.83        51
     ORG.NAM       0.93      0.96      0.94       182
     ORG.NOM       0.86      0.86      0.86        42
     PER.NAM       0.92      0.95      0.93       577
     PER.NOM       0.92      0.96      0.94       769

   micro avg       0.92      0.95      0.93      1889
   macro avg       0.85      0.88      0.87      1889
weighted avg       0.92      0.95      0.93      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.699, eval_acc=0.967, eval_loss=6.52, eval_precision=0.636, eval_recall=0.78] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.54      0.77      0.63        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.83      0.83      0.83         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.34      0.55      0.42        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.70      0.77      0.73        90
     PER.NOM       0.74      0.81      0.77       208

   micro avg       0.63      0.75      0.69       389
   macro avg       0.43      0.54      0.47       389
weighted avg       0.65      0.75      0.69       389



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.03it/s, F1=0.935, train_acc=0.996, train_loss=0.747, train_precision=0.922, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.84      0.93      0.88        56
     LOC.NOM       0.70      0.78      0.74        51
     ORG.NAM       0.93      0.96      0.95       182
     ORG.NOM       0.76      0.81      0.78        42
     PER.NAM       0.92      0.95      0.94       577
     PER.NOM       0.93      0.97      0.95       769

   micro avg       0.92      0.95      0.94      1889
   macro avg       0.87      0.89      0.88      1889
weighted avg       0.92      0.95      0.94      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.84it/s, F1=0.727, eval_acc=0.971, eval_loss=6.87, eval_precision=0.676, eval_recall=0.788]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.19      0.50      0.27         6
     ORG.NAM       0.41      0.40      0.41        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.75      0.78      0.77        90
     PER.NOM       0.74      0.82      0.78       208

   micro avg       0.66      0.75      0.71       389
   macro avg       0.50      0.72      0.58       389
weighted avg       0.68      0.75      0.71       389



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.942, train_acc=0.996, train_loss=0.698, train_precision=0.934, train_recall=0.956]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.79      0.89      0.84        56
     LOC.NOM       0.90      0.84      0.87        51
     ORG.NAM       0.94      0.97      0.95       182
     ORG.NOM       0.85      0.81      0.83        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.94      0.96      0.95      1889
   macro avg       0.90      0.91      0.91      1889
weighted avg       0.94      0.96      0.95      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.598, eval_acc=0.965, eval_loss=7.38, eval_precision=0.589, eval_recall=0.617]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.81      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.67      0.67      0.67         6
     LOC.NOM       0.09      0.17      0.12         6
     ORG.NAM       0.40      0.36      0.38        47
     ORG.NOM       0.15      0.60      0.24         5
     PER.NAM       0.76      0.72      0.74        90
     PER.NOM       0.70      0.60      0.65       208

   micro avg       0.62      0.61      0.62       389
   macro avg       0.55      0.62      0.56       389
weighted avg       0.65      0.61      0.63       389



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.01it/s, F1=0.926, train_acc=0.994, train_loss=0.954, train_precision=0.92, train_recall=0.94]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       204
     GPE.NOM       0.80      1.00      0.89         8
     LOC.NAM       0.93      0.93      0.93        56
     LOC.NOM       0.87      0.88      0.87        51
     ORG.NAM       0.96      0.97      0.97       182
     ORG.NOM       0.84      0.86      0.85        42
     PER.NAM       0.89      0.90      0.90       577
     PER.NOM       0.94      0.96      0.95       769

   micro avg       0.92      0.94      0.93      1889
   macro avg       0.90      0.94      0.92      1889
weighted avg       0.92      0.94      0.93      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.08it/s, F1=0.67, eval_acc=0.968, eval_loss=7.56, eval_precision=0.604, eval_recall=0.759] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.12      0.33      0.18         6
     ORG.NAM       0.40      0.47      0.43        47
     ORG.NOM       0.11      0.60      0.19         5
     PER.NAM       0.68      0.79      0.73        90
     PER.NOM       0.72      0.78      0.75       208

   micro avg       0.61      0.74      0.67       389
   macro avg       0.53      0.70      0.58       389
weighted avg       0.65      0.74      0.68       389



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.17it/s, F1=0.945, train_acc=0.996, train_loss=0.719, train_precision=0.936, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.96      0.95        56
     LOC.NOM       0.94      0.96      0.95        51
     ORG.NAM       0.93      0.96      0.94       182
     ORG.NOM       0.90      0.90      0.90        42
     PER.NAM       0.93      0.95      0.94       577
     PER.NOM       0.95      0.98      0.96       769

   micro avg       0.94      0.97      0.95      1889
   macro avg       0.93      0.95      0.94      1889
weighted avg       0.94      0.97      0.95      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.93it/s, F1=0.692, eval_acc=0.968, eval_loss=7.7, eval_precision=0.62, eval_recall=0.791]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.77      0.69        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.09      0.33      0.14         6
     ORG.NAM       0.43      0.49      0.46        47
     ORG.NOM       0.11      0.60      0.18         5
     PER.NAM       0.72      0.79      0.75        90
     PER.NOM       0.75      0.82      0.78       208

   micro avg       0.62      0.76      0.69       389
   macro avg       0.48      0.70      0.55       389
weighted avg       0.67      0.76      0.71       389



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.943, train_acc=0.995, train_loss=0.72, train_precision=0.935, train_recall=0.955] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.92      0.96      0.94        56
     LOC.NOM       0.92      0.94      0.93        51
     ORG.NAM       0.86      0.93      0.89       182
     ORG.NOM       0.90      0.88      0.89        42
     PER.NAM       0.93      0.95      0.94       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.94      0.96      0.95      1889
   macro avg       0.92      0.95      0.94      1889
weighted avg       0.94      0.96      0.95      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.687, eval_acc=0.968, eval_loss=7.64, eval_precision=0.618, eval_recall=0.781]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.12      0.33      0.18         6
     ORG.NAM       0.42      0.47      0.44        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.65      0.83      0.73        90
     PER.NOM       0.74      0.81      0.77       208

   micro avg       0.64      0.77      0.70       389
   macro avg       0.56      0.74      0.63       389
weighted avg       0.66      0.77      0.71       389



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.06it/s, F1=0.944, train_acc=0.996, train_loss=0.538, train_precision=0.936, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.93      0.93        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.91      0.95      0.93       182
     ORG.NOM       0.93      0.93      0.93        42
     PER.NAM       0.93      0.95      0.94       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.94      0.96      0.95      1889
   macro avg       0.93      0.94      0.94      1889
weighted avg       0.94      0.96      0.95      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.697, eval_acc=0.968, eval_loss=7.92, eval_precision=0.652, eval_recall=0.755]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.42      0.43      0.42        47
     ORG.NOM       0.25      0.60      0.35         5
     PER.NAM       0.79      0.80      0.80        90
     PER.NOM       0.75      0.78      0.76       208

   micro avg       0.67      0.74      0.70       389
   macro avg       0.49      0.70      0.56       389
weighted avg       0.69      0.74      0.71       389



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.19it/s, F1=0.958, train_acc=0.996, train_loss=0.497, train_precision=0.955, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      1.00      0.97        56
     LOC.NOM       0.98      0.96      0.97        51
     ORG.NAM       0.97      0.98      0.97       182
     ORG.NOM       0.95      0.90      0.93        42
     PER.NAM       0.95      0.96      0.95       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.95      0.96      0.95      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.666, eval_acc=0.967, eval_loss=7.97, eval_precision=0.6, eval_recall=0.755]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       1.00      0.83      0.91         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.34      0.47      0.40        47
     ORG.NOM       0.12      0.60      0.20         5
     PER.NAM       0.72      0.81      0.76        90
     PER.NOM       0.75      0.80      0.77       208

   micro avg       0.63      0.75      0.68       389
   macro avg       0.58      0.69      0.61       389
weighted avg       0.67      0.75      0.71       389



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.00it/s, F1=0.966, train_acc=0.997, train_loss=0.41, train_precision=0.96, train_recall=0.975]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.96      0.96      0.96        56
     LOC.NOM       0.96      1.00      0.98        51
     ORG.NAM       0.97      0.98      0.97       182
     ORG.NOM       0.93      0.98      0.95        42
     PER.NAM       0.95      0.97      0.96       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.96      0.98      0.97      1889
   macro avg       0.95      0.98      0.97      1889
weighted avg       0.96      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.00it/s, F1=0.704, eval_acc=0.969, eval_loss=8.82, eval_precision=0.654, eval_recall=0.767]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.81      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.39      0.45      0.42        47
     ORG.NOM       0.38      0.60      0.46         5
     PER.NAM       0.76      0.82      0.79        90
     PER.NOM       0.74      0.79      0.77       208

   micro avg       0.67      0.75      0.71       389
   macro avg       0.56      0.70      0.62       389
weighted avg       0.68      0.75      0.71       389



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.956, train_acc=0.997, train_loss=0.432, train_precision=0.952, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.95      0.94        56
     LOC.NOM       0.94      0.98      0.96        51
     ORG.NAM       0.96      0.99      0.97       182
     ORG.NOM       0.97      0.90      0.94        42
     PER.NAM       0.95      0.96      0.96       577
     PER.NOM       0.96      0.97      0.96       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.04it/s, F1=0.694, eval_acc=0.969, eval_loss=7.8, eval_precision=0.655, eval_recall=0.748] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.67      0.57         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.40      0.36      0.38        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.80      0.78      0.79        90
     PER.NOM       0.78      0.84      0.81       208

   micro avg       0.69      0.75      0.72       389
   macro avg       0.43      0.55      0.47       389
weighted avg       0.71      0.75      0.72       389



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.954, train_acc=0.997, train_loss=0.369, train_precision=0.953, train_recall=0.959]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.95      0.96      0.96        56
     LOC.NOM       0.89      0.94      0.91        51
     ORG.NAM       0.94      0.96      0.95       182
     ORG.NOM       0.93      0.90      0.92        42
     PER.NAM       0.97      0.96      0.97       577
     PER.NOM       0.96      0.97      0.97       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.673, eval_acc=0.968, eval_loss=8.84, eval_precision=0.641, eval_recall=0.718]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.81      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.83      0.83      0.83         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.39      0.40      0.40        47
     ORG.NOM       0.20      0.60      0.30         5
     PER.NAM       0.78      0.77      0.78        90
     PER.NOM       0.76      0.75      0.76       208

   micro avg       0.68      0.71      0.69       389
   macro avg       0.60      0.69      0.63       389
weighted avg       0.70      0.71      0.70       389



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.06it/s, F1=0.967, train_acc=0.997, train_loss=0.339, train_precision=0.964, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.98      0.95      0.96        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.95      0.96      0.95       182
     ORG.NOM       0.90      0.88      0.89        42
     PER.NAM       0.96      0.98      0.97       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.27it/s, F1=0.702, eval_acc=0.971, eval_loss=8.49, eval_precision=0.661, eval_recall=0.752]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.83      0.83      0.83         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.42      0.40      0.41        47
     ORG.NOM       0.25      0.60      0.35         5
     PER.NAM       0.82      0.81      0.82        90
     PER.NOM       0.71      0.77      0.74       208

   micro avg       0.67      0.73      0.70       389
   macro avg       0.60      0.68      0.63       389
weighted avg       0.68      0.73      0.70       389



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.14it/s, F1=0.964, train_acc=0.997, train_loss=0.366, train_precision=0.959, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      0.98      0.96        56
     LOC.NOM       0.88      0.90      0.89        51
     ORG.NAM       0.97      0.99      0.98       182
     ORG.NOM       0.95      0.90      0.93        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.94      0.95      0.94      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.684, eval_acc=0.967, eval_loss=8.39, eval_precision=0.652, eval_recall=0.723]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.36      0.36      0.36        47
     ORG.NOM       0.25      0.60      0.35         5
     PER.NAM       0.76      0.78      0.77        90
     PER.NOM       0.78      0.76      0.77       208

   micro avg       0.68      0.72      0.70       389
   macro avg       0.58      0.69      0.62       389
weighted avg       0.70      0.72      0.70       389



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.23it/s, F1=0.966, train_acc=0.997, train_loss=0.289, train_precision=0.963, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      1.00      0.97        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.93      0.95      0.94        42
     PER.NAM       0.95      0.97      0.96       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.96      0.98      0.97      1889
   macro avg       0.95      0.96      0.96      1889
weighted avg       0.96      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:04<00:00,  1.13it/s, F1=0.679, eval_acc=0.968, eval_loss=8.69, eval_precision=0.639, eval_recall=0.736]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       1.00      0.83      0.91         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.36      0.43      0.39        47
     ORG.NOM       0.38      0.60      0.46         5
     PER.NAM       0.77      0.77      0.77        90
     PER.NOM       0.76      0.78      0.77       208

   micro avg       0.68      0.73      0.70       389
   macro avg       0.57      0.70      0.61       389
weighted avg       0.70      0.73      0.71       389



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.967, train_acc=0.997, train_loss=0.292, train_precision=0.965, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.95      0.95        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.95      0.98      0.96       182
     ORG.NOM       0.93      0.90      0.92        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.95      0.97      0.96      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.712, eval_acc=0.969, eval_loss=8.65, eval_precision=0.654, eval_recall=0.786]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.18      0.33      0.24         6
     ORG.NAM       0.44      0.49      0.46        47
     ORG.NOM       0.31      0.80      0.44         5
     PER.NAM       0.76      0.78      0.77        90
     PER.NOM       0.76      0.83      0.79       208

   micro avg       0.67      0.77      0.72       389
   macro avg       0.57      0.74      0.63       389
weighted avg       0.69      0.77      0.73       389



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.961, train_acc=0.998, train_loss=0.312, train_precision=0.959, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.97      1.00      0.98        56
     LOC.NOM       0.93      0.98      0.95        51
     ORG.NAM       0.95      0.97      0.96       182
     ORG.NOM       0.95      0.90      0.93        42
     PER.NAM       0.96      0.97      0.96       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.95      0.97      0.96      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.30it/s, F1=0.677, eval_acc=0.966, eval_loss=9.29, eval_precision=0.645, eval_recall=0.717]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.81      0.68        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.25      0.33      0.29         6
     ORG.NAM       0.40      0.45      0.42        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.77      0.83      0.80        90
     PER.NOM       0.77      0.71      0.74       208

   micro avg       0.67      0.71      0.69       389
   macro avg       0.57      0.70      0.61       389
weighted avg       0.69      0.71      0.69       389



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:56<00:00,  2.99it/s, F1=0.968, train_acc=0.997, train_loss=0.315, train_precision=0.968, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       1.00      1.00      1.00         8
     LOC.NAM       0.98      0.93      0.95        56
     LOC.NOM       0.98      0.98      0.98        51
     ORG.NAM       0.95      0.97      0.96       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.97      0.96      0.96       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.97      0.97      0.97      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.68, eval_acc=0.963, eval_loss=10.3, eval_precision=0.624, eval_recall=0.747] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.92      0.73        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.20      0.50      0.29         6
     ORG.NAM       0.45      0.32      0.38        47
     ORG.NOM       0.14      0.60      0.23         5
     PER.NAM       0.66      0.81      0.73        90
     PER.NOM       0.73      0.79      0.76       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.48      0.72      0.56       389
weighted avg       0.65      0.74      0.69       389



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.966, train_acc=0.997, train_loss=0.289, train_precision=0.962, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.93      0.96      0.95        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.93      0.90      0.92        42
     PER.NAM       0.95      0.97      0.96       577
     PER.NOM       0.97      0.97      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.95      0.97      0.96      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.84it/s, F1=0.676, eval_acc=0.965, eval_loss=10.2, eval_precision=0.637, eval_recall=0.725]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.49      0.40      0.44        47
     ORG.NOM       0.12      0.60      0.20         5
     PER.NAM       0.83      0.78      0.80        90
     PER.NOM       0.73      0.75      0.74       208

   micro avg       0.66      0.71      0.68       389
   macro avg       0.53      0.67      0.57       389
weighted avg       0.69      0.71      0.70       389



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.973, train_acc=0.998, train_loss=0.232, train_precision=0.97, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.95      0.98      0.96        56
     LOC.NOM       0.94      0.98      0.96        51
     ORG.NAM       0.97      0.99      0.98       182
     ORG.NOM       0.95      0.93      0.94        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.97      0.96      0.96      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.71, eval_acc=0.968, eval_loss=10.6, eval_precision=0.702, eval_recall=0.72]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.92      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.83      0.83      0.83         6
     LOC.NOM       0.25      0.33      0.29         6
     ORG.NAM       0.49      0.40      0.44        47
     ORG.NOM       0.25      0.40      0.31         5
     PER.NAM       0.78      0.79      0.78        90
     PER.NOM       0.78      0.74      0.76       208

   micro avg       0.71      0.71      0.71       389
   macro avg       0.62      0.68      0.64       389
weighted avg       0.72      0.71      0.71       389



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:56<00:00,  2.99it/s, F1=0.966, train_acc=0.997, train_loss=0.427, train_precision=0.971, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       1.00      0.93      0.96        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.96      0.96      0.96       182
     ORG.NOM       0.86      0.86      0.86        42
     PER.NAM       0.96      0.95      0.96       577
     PER.NOM       0.97      0.97      0.97       769

   micro avg       0.97      0.96      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.97      0.96      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.25it/s, F1=0.696, eval_acc=0.964, eval_loss=10.6, eval_precision=0.651, eval_recall=0.75] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.81      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.20      0.17      0.18         6
     ORG.NAM       0.40      0.43      0.41        47
     ORG.NOM       0.24      0.80      0.36         5
     PER.NAM       0.78      0.80      0.79        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.67      0.75      0.71       389
   macro avg       0.56      0.70      0.61       389
weighted avg       0.68      0.75      0.71       389



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.17it/s, F1=0.966, train_acc=0.997, train_loss=0.43, train_precision=0.963, train_recall=0.973] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       1.00      1.00      1.00         8
     LOC.NAM       0.95      1.00      0.97        56
     LOC.NOM       0.94      0.98      0.96        51
     ORG.NAM       0.94      0.96      0.95       182
     ORG.NOM       0.90      0.90      0.90        42
     PER.NAM       0.96      0.96      0.96       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.96      0.97      0.96      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.662, eval_acc=0.967, eval_loss=8.37, eval_precision=0.614, eval_recall=0.724]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       0.33      1.00      0.50         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.33      0.45      0.38        47
     ORG.NOM       0.16      0.60      0.25         5
     PER.NAM       0.75      0.80      0.77        90
     PER.NOM       0.77      0.74      0.75       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.47      0.68      0.53       389
weighted avg       0.68      0.72      0.69       389



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.01it/s, F1=0.966, train_acc=0.997, train_loss=0.507, train_precision=0.965, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99       204
     GPE.NOM       0.67      0.75      0.71         8
     LOC.NAM       0.89      0.91      0.90        56
     LOC.NOM       0.90      0.88      0.89        51
     ORG.NAM       0.96      0.97      0.97       182
     ORG.NOM       0.88      0.86      0.87        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.90      0.91      0.91      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.26it/s, F1=0.664, eval_acc=0.965, eval_loss=9.04, eval_precision=0.607, eval_recall=0.741]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.77      0.67        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.12      0.33      0.17         6
     ORG.NAM       0.35      0.49      0.41        47
     ORG.NOM       0.19      0.60      0.29         5
     PER.NAM       0.76      0.76      0.76        90
     PER.NOM       0.76      0.79      0.77       208

   micro avg       0.64      0.74      0.68       389
   macro avg       0.54      0.70      0.59       389
weighted avg       0.68      0.74      0.70       389



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.968, train_acc=0.997, train_loss=0.359, train_precision=0.968, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.91      0.91      0.91        56
     LOC.NOM       0.91      0.96      0.93        51
     ORG.NAM       0.98      0.98      0.98       182
     ORG.NOM       0.93      0.93      0.93        42
     PER.NAM       0.97      0.96      0.97       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.94      0.96      0.95      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.83it/s, F1=0.698, eval_acc=0.964, eval_loss=10.5, eval_precision=0.627, eval_recall=0.791]


eval_reports:


calculate data/few_shot/weibo/train_1350.json etag:   0%|          | 0.00/911k [00:00<?, ?B/s]

              precision    recall  f1-score   support

     GPE.NAM       0.50      0.88      0.64        26
     GPE.NOM       0.50      1.00      0.67         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.17      0.33      0.22         6
     ORG.NAM       0.40      0.51      0.45        47
     ORG.NOM       0.30      0.60      0.40         5
     PER.NAM       0.65      0.78      0.71        90
     PER.NOM       0.77      0.84      0.81       208

   micro avg       0.64      0.78      0.70       389
   macro avg       0.48      0.72      0.57       389
weighted avg       0.66      0.78      0.71       389

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_1350.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/

calculate data/few_shot/weibo/train_1350.json etag: 100%|██████████| 911k/911k [00:00<00:00, 303MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 188MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 286MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 525kB/s]


load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree


count line size data/few_shot/weibo/labels.txt: 29L [00:00, 280264.55L/s]
build line mapper: 29L [00:00, 210077.40L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8673.95it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 280958.16it/s]
load dataset from data/few_shot/weibo/train_1350.json: 55it [00:00, 547.78it/s]

load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_1350.json: 1350it [00:02, 500.02it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 505.10it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mode

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.00874, train_acc=0.802, train_loss=41.6, train_precision=0.0164, train_recall=0.00817]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.00      0.00      0.00        56
     LOC.NOM       0.00      0.04      0.00        51
     ORG.NAM       0.00      0.00      0.00       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.04      0.01      0.01       577
     PER.NOM       0.22      0.01      0.01       769

   micro avg       0.00      0.01      0.00      1889
   macro avg       0.03      0.01      0.00      1889
weighted avg       0.10      0.01      0.01      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.24it/s, F1=0.309, eval_acc=0.95, eval_loss=10.7, eval_precision=0.247, eval_recall=0.415] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.12      0.08      0.09        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.17      0.44      0.25        90
     PER.NOM       0.43      0.62      0.51       208

   micro avg       0.27      0.44      0.33       389
   macro avg       0.09      0.14      0.11       389
weighted avg       0.28      0.44      0.34       389



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.03it/s, F1=0.516, train_acc=0.962, train_loss=7.57, train_precision=0.524, train_recall=0.541]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.53      0.56      0.54       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.00      0.00      0.00        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.18      0.26      0.21       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.48      0.54      0.51       577
     PER.NOM       0.61      0.70      0.65       769

   micro avg       0.50      0.54      0.52      1889
   macro avg       0.23      0.26      0.24      1889
weighted avg       0.47      0.54      0.50      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.599, eval_acc=0.966, eval_loss=5.52, eval_precision=0.516, eval_recall=0.724]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.49      0.73      0.58        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.21      0.43      0.28        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.62      0.81      0.71        90
     PER.NOM       0.67      0.80      0.73       208

   micro avg       0.54      0.71      0.62       389
   macro avg       0.25      0.35      0.29       389
weighted avg       0.56      0.71      0.63       389



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.14it/s, F1=0.701, train_acc=0.977, train_loss=4.14, train_precision=0.684, train_recall=0.741]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.75      0.87      0.81       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.09      0.14      0.11        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.42      0.60      0.49       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.73      0.78      0.75       577
     PER.NOM       0.75      0.84      0.79       769

   micro avg       0.66      0.73      0.69      1889
   macro avg       0.34      0.40      0.37      1889
weighted avg       0.65      0.73      0.69      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.667, eval_acc=0.969, eval_loss=5.39, eval_precision=0.657, eval_recall=0.678]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.23      0.50      0.32         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.33      0.32      0.33        47
     ORG.NOM       0.57      0.80      0.67         5
     PER.NAM       0.76      0.71      0.74        90
     PER.NOM       0.72      0.72      0.72       208

   micro avg       0.65      0.66      0.66       389
   macro avg       0.40      0.49      0.43       389
weighted avg       0.65      0.66      0.65       389



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.00it/s, F1=0.785, train_acc=0.984, train_loss=2.82, train_precision=0.76, train_recall=0.828] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.82      0.90      0.86       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.49      0.62      0.55        56
     LOC.NOM       0.12      0.12      0.12        51
     ORG.NAM       0.65      0.80      0.72       182
     ORG.NOM       0.25      0.24      0.24        42
     PER.NAM       0.80      0.85      0.82       577
     PER.NOM       0.82      0.89      0.86       769

   micro avg       0.76      0.82      0.79      1889
   macro avg       0.49      0.55      0.52      1889
weighted avg       0.75      0.82      0.79      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.624, eval_acc=0.953, eval_loss=6.61, eval_precision=0.521, eval_recall=0.782]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.24      0.83      0.37         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.25      0.47      0.33        47
     ORG.NOM       0.33      0.80      0.47         5
     PER.NAM       0.51      0.84      0.63        90
     PER.NOM       0.70      0.85      0.77       208

   micro avg       0.54      0.79      0.64       389
   macro avg       0.35      0.60      0.43       389
weighted avg       0.58      0.79      0.66       389



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.841, train_acc=0.988, train_loss=1.87, train_precision=0.826, train_recall=0.871]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.88      0.94      0.91       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.69      0.79      0.73        56
     LOC.NOM       0.24      0.25      0.25        51
     ORG.NAM       0.75      0.88      0.81       182
     ORG.NOM       0.38      0.50      0.43        42
     PER.NAM       0.83      0.86      0.85       577
     PER.NOM       0.87      0.92      0.89       769

   micro avg       0.81      0.87      0.84      1889
   macro avg       0.58      0.64      0.61      1889
weighted avg       0.81      0.87      0.84      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.651, eval_acc=0.966, eval_loss=6.58, eval_precision=0.575, eval_recall=0.757]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.92      0.79        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.29      0.83      0.43         6
     LOC.NOM       0.07      0.33      0.12         6
     ORG.NAM       0.43      0.45      0.44        47
     ORG.NOM       0.15      0.80      0.26         5
     PER.NAM       0.69      0.76      0.72        90
     PER.NOM       0.73      0.82      0.77       208

   micro avg       0.61      0.76      0.67       389
   macro avg       0.38      0.61      0.44       389
weighted avg       0.66      0.76      0.70       389



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.86, train_acc=0.991, train_loss=1.58, train_precision=0.84, train_recall=0.889]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.92      0.91       204
     GPE.NOM       0.50      0.25      0.33         8
     LOC.NAM       0.64      0.80      0.71        56
     LOC.NOM       0.40      0.49      0.44        51
     ORG.NAM       0.86      0.93      0.89       182
     ORG.NOM       0.54      0.62      0.58        42
     PER.NAM       0.89      0.91      0.90       577
     PER.NOM       0.88      0.93      0.90       769

   micro avg       0.85      0.90      0.87      1889
   macro avg       0.70      0.73      0.71      1889
weighted avg       0.85      0.90      0.87      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.68, eval_acc=0.964, eval_loss=6.18, eval_precision=0.605, eval_recall=0.778] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.51      0.92      0.66        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.41      0.43      0.42        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.60      0.86      0.71        90
     PER.NOM       0.73      0.85      0.78       208

   micro avg       0.61      0.78      0.69       389
   macro avg       0.38      0.56      0.45       389
weighted avg       0.62      0.78      0.69       389



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.02it/s, F1=0.903, train_acc=0.993, train_loss=1.18, train_precision=0.888, train_recall=0.926]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.89      0.94      0.92       204
     GPE.NOM       0.43      0.38      0.40         8
     LOC.NAM       0.75      0.80      0.78        56
     LOC.NOM       0.57      0.65      0.61        51
     ORG.NAM       0.85      0.94      0.89       182
     ORG.NOM       0.55      0.64      0.59        42
     PER.NAM       0.90      0.93      0.92       577
     PER.NOM       0.92      0.95      0.94       769

   micro avg       0.88      0.92      0.90      1889
   macro avg       0.73      0.78      0.75      1889
weighted avg       0.88      0.92      0.90      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.672, eval_acc=0.967, eval_loss=7.16, eval_precision=0.591, eval_recall=0.788]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.92      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.38      0.83      0.53         6
     LOC.NOM       0.42      0.83      0.56         6
     ORG.NAM       0.39      0.45      0.42        47
     ORG.NOM       0.12      0.60      0.20         5
     PER.NAM       0.71      0.82      0.76        90
     PER.NOM       0.73      0.85      0.78       208

   micro avg       0.63      0.80      0.70       389
   macro avg       0.54      0.79      0.62       389
weighted avg       0.66      0.80      0.72       389



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.919, train_acc=0.994, train_loss=1, train_precision=0.911, train_recall=0.935]    


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.97      0.96       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.80      0.88      0.84        56
     LOC.NOM       0.76      0.76      0.76        51
     ORG.NAM       0.87      0.94      0.90       182
     ORG.NOM       0.64      0.69      0.67        42
     PER.NAM       0.93      0.94      0.93       577
     PER.NOM       0.93      0.96      0.95       769

   micro avg       0.91      0.94      0.93      1889
   macro avg       0.84      0.86      0.85      1889
weighted avg       0.91      0.94      0.93      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.22it/s, F1=0.661, eval_acc=0.964, eval_loss=6.69, eval_precision=0.599, eval_recall=0.742]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.41      0.43      0.42        47
     ORG.NOM       0.08      0.40      0.13         5
     PER.NAM       0.73      0.77      0.75        90
     PER.NOM       0.73      0.80      0.76       208

   micro avg       0.62      0.74      0.68       389
   macro avg       0.50      0.66      0.55       389
weighted avg       0.66      0.74      0.69       389



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.01it/s, F1=0.934, train_acc=0.995, train_loss=0.861, train_precision=0.922, train_recall=0.953]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.98      0.97       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.88      0.89      0.88        56
     LOC.NOM       0.84      0.84      0.84        51
     ORG.NAM       0.90      0.95      0.92       182
     ORG.NOM       0.71      0.81      0.76        42
     PER.NAM       0.91      0.94      0.93       577
     PER.NOM       0.94      0.97      0.95       769

   micro avg       0.92      0.95      0.93      1889
   macro avg       0.87      0.89      0.88      1889
weighted avg       0.92      0.95      0.93      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.69, eval_acc=0.965, eval_loss=7.67, eval_precision=0.662, eval_recall=0.721] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.65      0.85      0.73        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.39      0.32      0.35        47
     ORG.NOM       0.12      0.40      0.18         5
     PER.NAM       0.78      0.78      0.78        90
     PER.NOM       0.74      0.78      0.76       208

   micro avg       0.67      0.71      0.69       389
   macro avg       0.56      0.64      0.58       389
weighted avg       0.68      0.71      0.70       389



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.95, train_acc=0.996, train_loss=0.717, train_precision=0.942, train_recall=0.965] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99       204
     GPE.NOM       0.70      0.88      0.78         8
     LOC.NAM       0.91      0.93      0.92        56
     LOC.NOM       0.81      0.86      0.84        51
     ORG.NAM       0.94      0.97      0.95       182
     ORG.NOM       0.84      0.88      0.86        42
     PER.NAM       0.95      0.96      0.95       577
     PER.NOM       0.95      0.98      0.96       769

   micro avg       0.94      0.96      0.95      1889
   macro avg       0.89      0.93      0.91      1889
weighted avg       0.94      0.96      0.95      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.708, eval_acc=0.967, eval_loss=6.93, eval_precision=0.677, eval_recall=0.743]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.42      0.40      0.41        47
     ORG.NOM       0.22      0.40      0.29         5
     PER.NAM       0.73      0.80      0.76        90
     PER.NOM       0.77      0.80      0.78       208

   micro avg       0.68      0.74      0.71       389
   macro avg       0.43      0.54      0.47       389
weighted avg       0.68      0.74      0.71       389



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.23it/s, F1=0.955, train_acc=0.997, train_loss=0.584, train_precision=0.95, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.89      0.91        56
     LOC.NOM       0.94      0.96      0.95        51
     ORG.NAM       0.97      0.97      0.97       182
     ORG.NOM       0.93      0.88      0.90        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.95      0.97      0.96      1889
   macro avg       0.94      0.94      0.94      1889
weighted avg       0.95      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.23it/s, F1=0.683, eval_acc=0.966, eval_loss=7.33, eval_precision=0.63, eval_recall=0.749] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.85      0.76        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.23      0.83      0.36         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.38      0.38      0.38        47
     ORG.NOM       0.16      0.60      0.25         5
     PER.NAM       0.68      0.81      0.74        90
     PER.NOM       0.76      0.80      0.78       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.53      0.72      0.58       389
weighted avg       0.67      0.75      0.70       389



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.04it/s, F1=0.959, train_acc=0.997, train_loss=0.486, train_precision=0.954, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.92      0.96      0.94        56
     LOC.NOM       0.98      0.96      0.97        51
     ORG.NAM       0.96      0.97      0.96       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.94      0.95      0.95       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.95      0.97      0.96      1889
   macro avg       0.94      0.97      0.95      1889
weighted avg       0.95      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.86it/s, F1=0.668, eval_acc=0.961, eval_loss=8.39, eval_precision=0.598, eval_recall=0.761]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.17      0.33      0.22         6
     ORG.NAM       0.40      0.49      0.44        47
     ORG.NOM       0.13      0.60      0.21         5
     PER.NAM       0.70      0.81      0.75        90
     PER.NOM       0.72      0.80      0.76       208

   micro avg       0.63      0.76      0.69       389
   macro avg       0.53      0.71      0.59       389
weighted avg       0.65      0.76      0.70       389



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.959, train_acc=0.997, train_loss=0.483, train_precision=0.957, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      0.96      0.96        56
     LOC.NOM       0.92      0.94      0.93        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.93      0.93      0.93        42
     PER.NAM       0.95      0.95      0.95       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.94      0.95      0.95      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.93it/s, F1=0.676, eval_acc=0.961, eval_loss=8.23, eval_precision=0.61, eval_recall=0.762]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.63      0.85      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.35      0.45      0.39        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.64      0.83      0.72        90
     PER.NOM       0.75      0.80      0.77       208

   micro avg       0.64      0.76      0.69       389
   macro avg       0.56      0.71      0.62       389
weighted avg       0.65      0.76      0.70       389



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.955, train_acc=0.996, train_loss=0.451, train_precision=0.951, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.91      0.91      0.91        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.97      0.97      0.97       182
     ORG.NOM       0.93      0.95      0.94        42
     PER.NAM       0.96      0.96      0.96       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.94      0.95      0.95      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.97it/s, F1=0.68, eval_acc=0.962, eval_loss=8.23, eval_precision=0.612, eval_recall=0.767] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.30      0.50      0.37         6
     ORG.NAM       0.34      0.49      0.40        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.70      0.83      0.76        90
     PER.NOM       0.72      0.82      0.76       208

   micro avg       0.63      0.77      0.69       389
   macro avg       0.55      0.73      0.62       389
weighted avg       0.65      0.77      0.70       389



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.03it/s, F1=0.957, train_acc=0.997, train_loss=0.42, train_precision=0.953, train_recall=0.967] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      0.95      0.95        56
     LOC.NOM       0.96      0.94      0.95        51
     ORG.NAM       0.97      0.98      0.97       182
     ORG.NOM       0.93      0.90      0.92        42
     PER.NAM       0.96      0.97      0.96       577
     PER.NOM       0.96      0.97      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.668, eval_acc=0.961, eval_loss=8.14, eval_precision=0.601, eval_recall=0.758]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.64      0.81      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.27      0.50      0.35         6
     ORG.NAM       0.38      0.45      0.41        47
     ORG.NOM       0.12      0.60      0.21         5
     PER.NAM       0.71      0.81      0.76        90
     PER.NOM       0.72      0.80      0.76       208

   micro avg       0.63      0.76      0.69       389
   macro avg       0.54      0.73      0.60       389
weighted avg       0.66      0.76      0.70       389



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.953, train_acc=0.997, train_loss=0.381, train_precision=0.949, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.78      0.88      0.82         8
     LOC.NAM       0.95      1.00      0.97        56
     LOC.NOM       0.96      1.00      0.98        51
     ORG.NAM       0.95      0.97      0.96       182
     ORG.NOM       0.84      0.88      0.86        42
     PER.NAM       0.96      0.96      0.96       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.92      0.96      0.94      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.23it/s, F1=0.678, eval_acc=0.964, eval_loss=8.84, eval_precision=0.606, eval_recall=0.775]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.92      0.74        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.38      0.45      0.41        47
     ORG.NOM       0.11      0.40      0.17         5
     PER.NAM       0.73      0.82      0.77        90
     PER.NOM       0.71      0.84      0.77       208

   micro avg       0.63      0.78      0.70       389
   macro avg       0.54      0.70      0.60       389
weighted avg       0.65      0.78      0.71       389



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:54<00:00,  3.08it/s, F1=0.963, train_acc=0.997, train_loss=0.398, train_precision=0.957, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.98      0.96        56
     LOC.NOM       0.94      0.94      0.94        51
     ORG.NAM       0.96      0.96      0.96       182
     ORG.NOM       0.91      0.93      0.92        42
     PER.NAM       0.96      0.97      0.96       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.94      0.97      0.96      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.692, eval_acc=0.965, eval_loss=8.83, eval_precision=0.643, eval_recall=0.75] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.77      0.71        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.37      0.47      0.41        47
     ORG.NOM       0.25      0.40      0.31         5
     PER.NAM       0.73      0.84      0.78        90
     PER.NOM       0.75      0.79      0.77       208

   micro avg       0.66      0.75      0.70       389
   macro avg       0.42      0.53      0.47       389
weighted avg       0.67      0.75      0.71       389



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.965, train_acc=0.997, train_loss=0.376, train_precision=0.962, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.98      0.93      0.95        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.92      0.96      0.94       182
     ORG.NOM       0.84      0.90      0.87        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.94      0.95      0.94      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.717, eval_acc=0.968, eval_loss=8.29, eval_precision=0.718, eval_recall=0.717]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.50      0.34      0.41        47
     ORG.NOM       0.33      0.40      0.36         5
     PER.NAM       0.78      0.79      0.78        90
     PER.NOM       0.79      0.75      0.77       208

   micro avg       0.73      0.71      0.72       389
   macro avg       0.61      0.66      0.63       389
weighted avg       0.73      0.71      0.72       389



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.02it/s, F1=0.962, train_acc=0.997, train_loss=0.418, train_precision=0.964, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      0.98      0.96        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.92      0.95      0.94       182
     ORG.NOM       0.84      0.88      0.86        42
     PER.NAM       0.96      0.97      0.96       577
     PER.NOM       0.97      0.97      0.97       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.93      0.95      0.94      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.41it/s, F1=0.695, eval_acc=0.965, eval_loss=9.98, eval_precision=0.64, eval_recall=0.763] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.88      0.73        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.50      0.40      0.45        47
     ORG.NOM       0.20      0.60      0.30         5
     PER.NAM       0.71      0.84      0.77        90
     PER.NOM       0.75      0.81      0.78       208

   micro avg       0.66      0.76      0.71       389
   macro avg       0.55      0.71      0.60       389
weighted avg       0.68      0.76      0.72       389



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.956, train_acc=0.996, train_loss=0.513, train_precision=0.954, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.98      0.97       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      0.93      0.94        56
     LOC.NOM       0.83      0.94      0.88        51
     ORG.NAM       0.90      0.94      0.92       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.97      0.96      0.97       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.95      0.96      0.96      1889
   macro avg       0.92      0.94      0.93      1889
weighted avg       0.95      0.96      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.24it/s, F1=0.699, eval_acc=0.963, eval_loss=8.23, eval_precision=0.647, eval_recall=0.763]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.42      0.47      0.44        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.74      0.83      0.78        90
     PER.NOM       0.75      0.81      0.78       208

   micro avg       0.67      0.76      0.71       389
   macro avg       0.54      0.67      0.59       389
weighted avg       0.68      0.76      0.72       389



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.23it/s, F1=0.96, train_acc=0.996, train_loss=0.413, train_precision=0.955, train_recall=0.97]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.98      0.96        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.95      0.98      0.96       182
     ORG.NOM       0.86      0.88      0.87        42
     PER.NAM       0.96      0.97      0.97       577
     PER.NOM       0.96      0.96      0.96       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.94      0.97      0.95      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.698, eval_acc=0.965, eval_loss=9.1, eval_precision=0.647, eval_recall=0.76]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.12      0.33      0.18         6
     ORG.NAM       0.44      0.47      0.45        47
     ORG.NOM       0.23      0.60      0.33         5
     PER.NAM       0.72      0.82      0.77        90
     PER.NOM       0.75      0.80      0.78       208

   micro avg       0.66      0.76      0.70       389
   macro avg       0.54      0.71      0.60       389
weighted avg       0.68      0.76      0.71       389



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.07it/s, F1=0.963, train_acc=0.998, train_loss=0.343, train_precision=0.964, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.93      0.95      0.94        56
     LOC.NOM       0.91      0.98      0.94        51
     ORG.NAM       0.96      0.97      0.96       182
     ORG.NOM       0.90      0.90      0.90        42
     PER.NAM       0.98      0.96      0.97       577
     PER.NOM       0.97      0.99      0.98       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.94      0.94      0.94      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.715, eval_acc=0.968, eval_loss=8.92, eval_precision=0.698, eval_recall=0.735]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.17      0.17      0.17         6
     ORG.NAM       0.55      0.38      0.45        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.76      0.79      0.77        90
     PER.NOM       0.77      0.79      0.78       208

   micro avg       0.72      0.74      0.73       389
   macro avg       0.61      0.68      0.63       389
weighted avg       0.72      0.74      0.72       389



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.23it/s, F1=0.969, train_acc=0.998, train_loss=0.302, train_precision=0.968, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.96      0.95      0.95        56
     LOC.NOM       0.92      0.94      0.93        51
     ORG.NAM       0.95      0.96      0.95       182
     ORG.NOM       0.97      0.90      0.94        42
     PER.NAM       0.97      0.98      0.98       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.669, eval_acc=0.962, eval_loss=9.41, eval_precision=0.608, eval_recall=0.751]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.92      0.73        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.20      0.33      0.25         6
     ORG.NAM       0.33      0.45      0.38        47
     ORG.NOM       0.18      0.80      0.30         5
     PER.NAM       0.79      0.78      0.78        90
     PER.NOM       0.75      0.79      0.77       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.54      0.74      0.60       389
weighted avg       0.68      0.75      0.70       389



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.957, train_acc=0.997, train_loss=0.28, train_precision=0.959, train_recall=0.959] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.95      0.94        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.95      0.96      0.95       182
     ORG.NOM       0.91      0.93      0.92        42
     PER.NAM       0.98      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  3.84it/s, F1=0.719, eval_acc=0.968, eval_loss=9.71, eval_precision=0.691, eval_recall=0.751]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.33      0.50      0.40         6
     ORG.NAM       0.48      0.34      0.40        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.78      0.78      0.78        90
     PER.NOM       0.75      0.82      0.78       208

   micro avg       0.70      0.75      0.72       389
   macro avg       0.60      0.72      0.64       389
weighted avg       0.70      0.75      0.72       389



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.02it/s, F1=0.969, train_acc=0.997, train_loss=0.363, train_precision=0.969, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.95      0.95      0.95        56
     LOC.NOM       0.94      0.96      0.95        51
     ORG.NAM       0.93      0.96      0.94       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.98      0.98      0.98       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.94      0.95      0.94      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.688, eval_acc=0.965, eval_loss=9.83, eval_precision=0.635, eval_recall=0.757]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.22      0.33      0.27         6
     ORG.NAM       0.46      0.45      0.45        47
     ORG.NOM       0.19      0.60      0.29         5
     PER.NAM       0.76      0.81      0.78        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.67      0.76      0.71       389
   macro avg       0.56      0.71      0.61       389
weighted avg       0.69      0.76      0.72       389



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.964, train_acc=0.997, train_loss=0.289, train_precision=0.962, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      1.00      0.97        56
     LOC.NOM       0.96      1.00      0.98        51
     ORG.NAM       0.97      0.99      0.98       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.97      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.95      0.98      0.96      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.20it/s, F1=0.706, eval_acc=0.966, eval_loss=9.41, eval_precision=0.68, eval_recall=0.736] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.53      0.92      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.25      0.33      0.29         6
     ORG.NAM       0.53      0.34      0.42        47
     ORG.NOM       0.29      0.80      0.42         5
     PER.NAM       0.83      0.77      0.80        90
     PER.NOM       0.75      0.79      0.77       208

   micro avg       0.70      0.73      0.71       389
   macro avg       0.46      0.60      0.50       389
weighted avg       0.71      0.73      0.71       389



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.01it/s, F1=0.976, train_acc=0.998, train_loss=0.261, train_precision=0.978, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       1.00      1.00      1.00         8
     LOC.NAM       1.00      0.95      0.97        56
     LOC.NOM       0.98      0.94      0.96        51
     ORG.NAM       0.97      0.97      0.97       182
     ORG.NOM       0.91      0.93      0.92        42
     PER.NAM       0.98      0.97      0.98       577
     PER.NOM       0.98      0.99      0.98       769

   micro avg       0.98      0.98      0.98      1889
   macro avg       0.97      0.97      0.97      1889
weighted avg       0.98      0.98      0.98      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.24it/s, F1=0.685, eval_acc=0.964, eval_loss=8.41, eval_precision=0.629, eval_recall=0.755]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.52      0.88      0.66        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.43      0.50      0.46         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.45      0.40        47
     ORG.NOM       0.18      0.60      0.27         5
     PER.NAM       0.75      0.84      0.80        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.64      0.75      0.69       389
   macro avg       0.50      0.63      0.54       389
weighted avg       0.66      0.75      0.70       389



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.971, train_acc=0.998, train_loss=0.231, train_precision=0.969, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      1.00       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.90      0.93      0.91        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.90      0.90      0.90        42
     PER.NAM       0.98      0.98      0.98       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.98      1889
   macro avg       0.95      0.97      0.96      1889
weighted avg       0.97      0.98      0.98      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.691, eval_acc=0.965, eval_loss=10.1, eval_precision=0.642, eval_recall=0.755]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.88      0.77        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.17      0.33      0.22         6
     ORG.NAM       0.45      0.45      0.45        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.79      0.82      0.80        90
     PER.NOM       0.76      0.79      0.77       208

   micro avg       0.67      0.76      0.71       389
   macro avg       0.55      0.71      0.60       389
weighted avg       0.70      0.76      0.72       389



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.97, train_acc=0.998, train_loss=0.285, train_precision=0.966, train_recall=0.977] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.86      0.89      0.88        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.96      0.98      0.97       182
     ORG.NOM       0.86      0.90      0.88        42
     PER.NAM       0.98      0.98      0.98       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.93      0.95      0.94      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.691, eval_acc=0.965, eval_loss=9.72, eval_precision=0.667, eval_recall=0.722]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.67      0.92      0.77        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.36      0.83      0.50         6
     LOC.NOM       0.25      0.33      0.29         6
     ORG.NAM       0.42      0.45      0.43        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.85      0.71      0.78        90
     PER.NOM       0.77      0.75      0.76       208

   micro avg       0.69      0.71      0.70       389
   macro avg       0.57      0.70      0.61       389
weighted avg       0.72      0.71      0.71       389



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:56<00:00,  2.98it/s, F1=0.97, train_acc=0.998, train_loss=0.302, train_precision=0.97, train_recall=0.972]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      0.99      0.99       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.91      0.93      0.92        56
     LOC.NOM       0.96      0.94      0.95        51
     ORG.NAM       0.97      0.99      0.98       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.98      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.96      0.95      0.95      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.709, eval_acc=0.968, eval_loss=8.65, eval_precision=0.694, eval_recall=0.727]


eval_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.60      0.92      0.73        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.42      0.83      0.56         6
     LOC.NOM       0.40      0.33      0.36         6
     ORG.NAM       0.53      0.36      0.43        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.81      0.79      0.80        90
     PER.NOM       0.77      0.75      0.76       208

   micro avg       0.71      0.72      0.72       389
   macro avg       0.60      0.70      0.63       389
weighted avg       0.72      0.72      0.71       389



calculate data/few_shot/weibo/train_1350.json etag: 100%|██████████| 911k/911k [00:00<00:00, 312MB/s]
calculate data/few_shot/weibo/dev.json etag: 100%|██████████| 180k/180k [00:00<00:00, 190MB/s]
calculate data/few_shot/weibo/test.json etag: 100%|██████████| 184k/184k [00:00<00:00, 286MB/s]
calculate data/few_shot/weibo/labels.txt etag: 100%|██████████| 272/272 [00:00<00:00, 524kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/weibo/train_1350.json",
    "eval_file": "data/few_shot/weibo/dev.json",
    "test_file": "data/few_shot/weibo/test.json",
    "tag_file": "data/few_shot/weibo/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "weibo_pretrain_lebert_crf_1350_x3"
}
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/lexicon_tree



count line size data/few_shot/weibo/labels.txt: 29L [00:00, 184295.18L/s]
build line mapper: 29L [00:00, 30264.95L/s]9 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8318.62it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 241647.14it/s]
load dataset from data/few_shot/weibo/train_1350.json: 36it [00:00, 357.84it/s]

load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/matched_words
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/word_vocab
load cached ./temp/019570c570c6a6a1ee32b781734ca455_09aa1aaf832ce26fdd3856a1e9efec4a_80b03b9eb036cba8e85f623155e5f057_c8c242fc3f6ea09f357d4bd7f5116722/1000000/vocab_embedding


load dataset from data/few_shot/weibo/train_1350.json: 1350it [00:03, 342.67it/s]
load dataset from data/few_shot/weibo/dev.json: 271it [00:00, 342.71it/s]
Some weights of the model checkpoint at save_pretrained/weibo_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mode

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.17it/s, F1=0.00635, train_acc=0.801, train_loss=51.9, train_precision=0.00519, train_recall=0.00841]   


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.00      0.00      0.00        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.00      0.00      0.00       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.00      0.00      0.00       577
     PER.NOM       0.01      0.02      0.01       769

   micro avg       0.00      0.01      0.00      1889
   macro avg       0.00      0.00      0.00      1889
weighted avg       0.00      0.01      0.01      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.20it/s, F1=0.193, eval_acc=0.937, eval_loss=13.1, eval_precision=0.13, eval_recall=0.372] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.00      0.00      0.00        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.00      0.00      0.00        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.00      0.00      0.00        90
     PER.NOM       0.28      0.76      0.41       208

   micro avg       0.15      0.41      0.21       389
   macro avg       0.04      0.09      0.05       389
weighted avg       0.15      0.41      0.22       389



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.414, train_acc=0.96, train_loss=8.65, train_precision=0.393, train_recall=0.456]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.53      0.66      0.59       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.00      0.00      0.00        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.09      0.11      0.10       182
     ORG.NOM       0.00      0.00      0.00        42
     PER.NAM       0.23      0.35      0.27       577
     PER.NOM       0.52      0.68      0.59       769

   micro avg       0.37      0.47      0.41      1889
   macro avg       0.17      0.23      0.19      1889
weighted avg       0.35      0.47      0.40      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.538, eval_acc=0.962, eval_loss=6.47, eval_precision=0.432, eval_recall=0.727]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.36      0.77      0.49        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.00      0.00      0.00         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.11      0.26      0.15        47
     ORG.NOM       0.00      0.00      0.00         5
     PER.NAM       0.46      0.76      0.57        90
     PER.NOM       0.62      0.83      0.71       208

   micro avg       0.45      0.70      0.55       389
   macro avg       0.19      0.33      0.24       389
weighted avg       0.47      0.70      0.56       389



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.01it/s, F1=0.646, train_acc=0.976, train_loss=4.82, train_precision=0.613, train_recall=0.702]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.68      0.83      0.75       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.04      0.05      0.04        56
     LOC.NOM       0.00      0.00      0.00        51
     ORG.NAM       0.34      0.51      0.41       182
     ORG.NOM       0.67      0.14      0.24        42
     PER.NAM       0.55      0.70      0.61       577
     PER.NOM       0.76      0.85      0.80       769

   micro avg       0.60      0.70      0.64      1889
   macro avg       0.38      0.39      0.36      1889
weighted avg       0.60      0.70      0.64      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.619, eval_acc=0.967, eval_loss=5.89, eval_precision=0.563, eval_recall=0.688]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.88      0.75        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.15      0.33      0.21         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.27      0.26      0.26        47
     ORG.NOM       1.00      0.80      0.89         5
     PER.NAM       0.46      0.76      0.57        90
     PER.NOM       0.73      0.77      0.75       208

   micro avg       0.58      0.69      0.63       389
   macro avg       0.41      0.47      0.43       389
weighted avg       0.59      0.69      0.63       389



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.751, train_acc=0.984, train_loss=3.36, train_precision=0.724, train_recall=0.798]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.84      0.90      0.87       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.28      0.41      0.34        56
     LOC.NOM       0.08      0.08      0.08        51
     ORG.NAM       0.65      0.79      0.71       182
     ORG.NOM       0.60      0.43      0.50        42
     PER.NAM       0.67      0.80      0.73       577
     PER.NOM       0.83      0.89      0.86       769

   micro avg       0.72      0.80      0.76      1889
   macro avg       0.49      0.54      0.51      1889
weighted avg       0.72      0.80      0.76      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.634, eval_acc=0.967, eval_loss=6.24, eval_precision=0.559, eval_recall=0.737]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.88      0.69        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.14      0.50      0.21         6
     LOC.NOM       0.14      0.33      0.20         6
     ORG.NAM       0.23      0.34      0.28        47
     ORG.NOM       0.42      1.00      0.59         5
     PER.NAM       0.61      0.73      0.67        90
     PER.NOM       0.74      0.82      0.78       208

   micro avg       0.57      0.73      0.64       389
   macro avg       0.35      0.58      0.43       389
weighted avg       0.61      0.73      0.66       389



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.02it/s, F1=0.802, train_acc=0.988, train_loss=2.37, train_precision=0.772, train_recall=0.847]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.87      0.94      0.90       204
     GPE.NOM       0.00      0.00      0.00         8
     LOC.NAM       0.35      0.50      0.41        56
     LOC.NOM       0.17      0.22      0.19        51
     ORG.NAM       0.75      0.85      0.80       182
     ORG.NOM       0.55      0.55      0.55        42
     PER.NAM       0.72      0.83      0.77       577
     PER.NOM       0.87      0.93      0.90       769

   micro avg       0.76      0.85      0.80      1889
   macro avg       0.54      0.60      0.57      1889
weighted avg       0.77      0.85      0.81      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.25it/s, F1=0.673, eval_acc=0.968, eval_loss=6.18, eval_precision=0.633, eval_recall=0.72] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.69      0.85      0.76        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.33      0.67      0.44         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.38      0.37        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.63      0.73      0.68        90
     PER.NOM       0.75      0.78      0.76       208

   micro avg       0.64      0.71      0.67       389
   macro avg       0.40      0.53      0.45       389
weighted avg       0.65      0.71      0.68       389



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.841, train_acc=0.991, train_loss=1.72, train_precision=0.823, train_recall=0.869]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.92      0.94      0.93       204
     GPE.NOM       0.33      0.12      0.18         8
     LOC.NAM       0.56      0.68      0.61        56
     LOC.NOM       0.34      0.45      0.39        51
     ORG.NAM       0.83      0.90      0.86       182
     ORG.NOM       0.57      0.57      0.57        42
     PER.NAM       0.82      0.88      0.85       577
     PER.NOM       0.90      0.94      0.92       769

   micro avg       0.83      0.89      0.86      1889
   macro avg       0.66      0.69      0.66      1889
weighted avg       0.84      0.89      0.86      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.683, eval_acc=0.968, eval_loss=6.81, eval_precision=0.63, eval_recall=0.746] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.81      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.33      0.38      0.36        47
     ORG.NOM       0.36      0.80      0.50         5
     PER.NAM       0.60      0.79      0.68        90
     PER.NOM       0.76      0.81      0.78       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.55      0.68      0.60       389
weighted avg       0.65      0.74      0.69       389



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.885, train_acc=0.994, train_loss=1.24, train_precision=0.872, train_recall=0.907]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.98      0.97       204
     GPE.NOM       0.75      0.75      0.75         8
     LOC.NAM       0.77      0.88      0.82        56
     LOC.NOM       0.68      0.71      0.69        51
     ORG.NAM       0.89      0.93      0.91       182
     ORG.NOM       0.73      0.71      0.72        42
     PER.NAM       0.87      0.92      0.89       577
     PER.NOM       0.91      0.95      0.93       769

   micro avg       0.89      0.93      0.91      1889
   macro avg       0.82      0.85      0.84      1889
weighted avg       0.89      0.93      0.91      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.647, eval_acc=0.963, eval_loss=7.64, eval_precision=0.563, eval_recall=0.768]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.88      0.72        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.25      0.17      0.20         6
     LOC.NOM       0.15      0.50      0.23         6
     ORG.NAM       0.33      0.45      0.38        47
     ORG.NOM       0.18      0.80      0.30         5
     PER.NAM       0.60      0.81      0.69        90
     PER.NOM       0.72      0.83      0.77       208

   micro avg       0.59      0.77      0.67       389
   macro avg       0.48      0.68      0.54       389
weighted avg       0.62      0.77      0.68       389



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.00it/s, F1=0.919, train_acc=0.994, train_loss=1.08, train_precision=0.904, train_recall=0.94]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.98      0.97       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.70      0.79      0.74        56
     LOC.NOM       0.70      0.78      0.74        51
     ORG.NAM       0.93      0.97      0.95       182
     ORG.NOM       0.77      0.79      0.78        42
     PER.NAM       0.88      0.93      0.90       577
     PER.NOM       0.93      0.96      0.94       769

   micro avg       0.90      0.94      0.92      1889
   macro avg       0.86      0.88      0.87      1889
weighted avg       0.90      0.94      0.92      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.14it/s, F1=0.654, eval_acc=0.963, eval_loss=7.61, eval_precision=0.576, eval_recall=0.759]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.66      0.81      0.72        26
     GPE.NOM       0.33      1.00      0.50         1
     LOC.NAM       0.28      0.83      0.42         6
     LOC.NOM       0.13      0.50      0.21         6
     ORG.NAM       0.37      0.40      0.39        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.66      0.81      0.73        90
     PER.NOM       0.69      0.82      0.75       208

   micro avg       0.59      0.76      0.67       389
   macro avg       0.42      0.72      0.50       389
weighted avg       0.62      0.76      0.68       389



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.16it/s, F1=0.925, train_acc=0.995, train_loss=0.854, train_precision=0.915, train_recall=0.94] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.96      0.97      0.97       204
     GPE.NOM       0.78      0.88      0.82         8
     LOC.NAM       0.81      0.86      0.83        56
     LOC.NOM       0.78      0.82      0.80        51
     ORG.NAM       0.88      0.92      0.90       182
     ORG.NOM       0.76      0.74      0.75        42
     PER.NAM       0.91      0.94      0.93       577
     PER.NOM       0.94      0.96      0.95       769

   micro avg       0.91      0.94      0.93      1889
   macro avg       0.85      0.89      0.87      1889
weighted avg       0.91      0.94      0.93      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.657, eval_acc=0.964, eval_loss=7.59, eval_precision=0.584, eval_recall=0.754]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.45      0.83      0.59         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.35      0.43      0.38        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.58      0.81      0.68        90
     PER.NOM       0.76      0.81      0.78       208

   micro avg       0.61      0.75      0.67       389
   macro avg       0.51      0.69      0.57       389
weighted avg       0.64      0.75      0.69       389



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:56<00:00,  2.98it/s, F1=0.933, train_acc=0.996, train_loss=0.693, train_precision=0.926, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.88      0.91      0.89        56
     LOC.NOM       0.88      0.90      0.89        51
     ORG.NAM       0.94      0.96      0.95       182
     ORG.NOM       0.86      0.86      0.86        42
     PER.NAM       0.91      0.95      0.93       577
     PER.NOM       0.94      0.96      0.95       769

   micro avg       0.93      0.95      0.94      1889
   macro avg       0.91      0.92      0.92      1889
weighted avg       0.93      0.95      0.94      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.08it/s, F1=0.67, eval_acc=0.966, eval_loss=7.29, eval_precision=0.619, eval_recall=0.735] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.33      0.38      0.36        47
     ORG.NOM       0.20      0.60      0.30         5
     PER.NAM       0.67      0.74      0.71        90
     PER.NOM       0.75      0.80      0.77       208

   micro avg       0.63      0.73      0.68       389
   macro avg       0.53      0.65      0.58       389
weighted avg       0.65      0.73      0.69       389



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.928, train_acc=0.996, train_loss=0.637, train_precision=0.919, train_recall=0.943]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.82      0.89      0.85        56
     LOC.NOM       0.90      0.84      0.87        51
     ORG.NAM       0.91      0.95      0.93       182
     ORG.NOM       0.81      0.83      0.82        42
     PER.NAM       0.90      0.94      0.92       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.92      0.95      0.94      1889
   macro avg       0.89      0.90      0.89      1889
weighted avg       0.92      0.95      0.94      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.679, eval_acc=0.965, eval_loss=7.98, eval_precision=0.661, eval_recall=0.701]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       1.00      0.83      0.91         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.37      0.47      0.42        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.66      0.73      0.69        90
     PER.NOM       0.80      0.71      0.75       208

   micro avg       0.67      0.68      0.67       389
   macro avg       0.61      0.66      0.63       389
weighted avg       0.69      0.68      0.68       389



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.932, train_acc=0.996, train_loss=0.794, train_precision=0.919, train_recall=0.953]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.85      0.89      0.87        56
     LOC.NOM       0.91      0.94      0.92        51
     ORG.NAM       0.91      0.96      0.93       182
     ORG.NOM       0.86      0.86      0.86        42
     PER.NAM       0.89      0.94      0.91       577
     PER.NOM       0.96      0.97      0.96       769

   micro avg       0.92      0.96      0.94      1889
   macro avg       0.90      0.93      0.91      1889
weighted avg       0.93      0.96      0.94      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.604, eval_acc=0.962, eval_loss=7.42, eval_precision=0.584, eval_recall=0.627]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.70      0.81      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.35      0.32      0.33        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.55      0.79      0.65        90
     PER.NOM       0.79      0.62      0.70       208

   micro avg       0.61      0.63      0.62       389
   macro avg       0.51      0.65      0.55       389
weighted avg       0.65      0.63      0.63       389



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.02it/s, F1=0.934, train_acc=0.996, train_loss=0.728, train_precision=0.924, train_recall=0.949]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.95      0.98      0.96       204
     GPE.NOM       0.78      0.88      0.82         8
     LOC.NAM       0.93      0.98      0.96        56
     LOC.NOM       0.88      0.96      0.92        51
     ORG.NAM       0.92      0.95      0.93       182
     ORG.NOM       0.84      0.86      0.85        42
     PER.NAM       0.90      0.94      0.92       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.94      0.96      0.95      1889
   macro avg       0.90      0.94      0.92      1889
weighted avg       0.94      0.96      0.95      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.34it/s, F1=0.651, eval_acc=0.961, eval_loss=9.58, eval_precision=0.569, eval_recall=0.766]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.48      0.81      0.60        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.56      0.83      0.67         6
     LOC.NOM       0.06      0.17      0.09         6
     ORG.NAM       0.33      0.47      0.39        47
     ORG.NOM       0.12      0.80      0.21         5
     PER.NAM       0.64      0.72      0.68        90
     PER.NOM       0.72      0.78      0.75       208

   micro avg       0.57      0.72      0.64       389
   macro avg       0.49      0.70      0.55       389
weighted avg       0.62      0.72      0.66       389



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.955, train_acc=0.997, train_loss=0.432, train_precision=0.947, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.93      0.96      0.95        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.95      0.97      0.96       182
     ORG.NOM       0.90      0.90      0.90        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.95      0.97      0.96      1889
   macro avg       0.94      0.97      0.95      1889
weighted avg       0.95      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.16it/s, F1=0.702, eval_acc=0.966, eval_loss=8.31, eval_precision=0.673, eval_recall=0.735]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.77      0.67        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.83      0.83      0.83         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.41      0.36      0.39        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.68      0.77      0.72        90
     PER.NOM       0.76      0.81      0.78       208

   micro avg       0.68      0.73      0.70       389
   macro avg       0.46      0.54      0.49       389
weighted avg       0.67      0.73      0.70       389



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.02it/s, F1=0.961, train_acc=0.997, train_loss=0.379, train_precision=0.959, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       1.00      0.75      0.86         8
     LOC.NAM       0.93      0.96      0.95        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.96      0.97      0.96       182
     ORG.NOM       0.90      0.88      0.89        42
     PER.NAM       0.94      0.95      0.95       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.96      0.94      0.94      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s, F1=0.695, eval_acc=0.969, eval_loss=8.22, eval_precision=0.64, eval_recall=0.764] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.59      0.85      0.70        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.36      0.40      0.38        47
     ORG.NOM       0.14      0.60      0.22         5
     PER.NAM       0.65      0.78      0.71        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.53      0.66      0.57       389
weighted avg       0.66      0.72      0.69       389



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.961, train_acc=0.997, train_loss=0.4, train_precision=0.954, train_recall=0.973]  


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      1.00       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.95      0.94        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.96      0.98      0.97       182
     ORG.NOM       0.76      0.83      0.80        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.95      0.97      0.96      1889
   macro avg       0.92      0.94      0.93      1889
weighted avg       0.95      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.12it/s, F1=0.684, eval_acc=0.968, eval_loss=7.99, eval_precision=0.639, eval_recall=0.741]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.37      0.40      0.38        47
     ORG.NOM       0.19      0.60      0.29         5
     PER.NAM       0.74      0.78      0.76        90
     PER.NOM       0.78      0.76      0.77       208

   micro avg       0.66      0.71      0.68       389
   macro avg       0.53      0.67      0.58       389
weighted avg       0.69      0.71      0.70       389



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.966, train_acc=0.997, train_loss=0.345, train_precision=0.961, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.96      0.96        56
     LOC.NOM       0.96      1.00      0.98        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.93      0.93      0.93        42
     PER.NAM       0.95      0.97      0.96       577
     PER.NOM       0.97      0.97      0.97       769

   micro avg       0.96      0.97      0.97      1889
   macro avg       0.95      0.98      0.96      1889
weighted avg       0.96      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.02it/s, F1=0.708, eval_acc=0.968, eval_loss=9.17, eval_precision=0.695, eval_recall=0.722]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.77      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.71      0.83      0.77         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.47      0.34      0.40        47
     ORG.NOM       0.33      0.60      0.43         5
     PER.NAM       0.72      0.73      0.73        90
     PER.NOM       0.78      0.80      0.79       208

   micro avg       0.70      0.71      0.71       389
   macro avg       0.47      0.53      0.49       389
weighted avg       0.70      0.71      0.70       389



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:56<00:00,  2.98it/s, F1=0.959, train_acc=0.997, train_loss=0.371, train_precision=0.953, train_recall=0.97] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.97      0.99      0.98       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.93      0.98      0.96        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.95      0.96      0.95       182
     ORG.NOM       0.93      0.88      0.90        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.97      0.98      0.98       769

   micro avg       0.96      0.97      0.96      1889
   macro avg       0.94      0.93      0.94      1889
weighted avg       0.96      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.651, eval_acc=0.965, eval_loss=9.26, eval_precision=0.595, eval_recall=0.729]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.81      0.67        26
     GPE.NOM       0.33      1.00      0.50         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.40      0.38      0.39        47
     ORG.NOM       0.12      0.60      0.21         5
     PER.NAM       0.73      0.71      0.72        90
     PER.NOM       0.74      0.80      0.77       208

   micro avg       0.63      0.72      0.67       389
   macro avg       0.45      0.66      0.51       389
weighted avg       0.66      0.72      0.69       389



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.922, train_acc=0.995, train_loss=0.936, train_precision=0.912, train_recall=0.936]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       204
     GPE.NOM       0.86      0.75      0.80         8
     LOC.NAM       0.83      0.88      0.85        56
     LOC.NOM       0.96      0.98      0.97        51
     ORG.NAM       0.91      0.95      0.93       182
     ORG.NOM       0.89      0.93      0.91        42
     PER.NAM       0.86      0.91      0.88       577
     PER.NOM       0.96      0.97      0.96       769

   micro avg       0.92      0.94      0.93      1889
   macro avg       0.91      0.92      0.91      1889
weighted avg       0.92      0.94      0.93      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.32it/s, F1=0.669, eval_acc=0.97, eval_loss=8.34, eval_precision=0.627, eval_recall=0.728] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.81      0.66        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.25      0.17      0.20         6
     ORG.NAM       0.40      0.45      0.42        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.67      0.73      0.70        90
     PER.NOM       0.77      0.77      0.77       208

   micro avg       0.66      0.71      0.69       389
   macro avg       0.57      0.67      0.61       389
weighted avg       0.67      0.71      0.69       389



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:57<00:00,  2.96it/s, F1=0.937, train_acc=0.996, train_loss=0.667, train_precision=0.928, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      0.99      0.98       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.86      0.89      0.88        56
     LOC.NOM       0.91      0.94      0.92        51
     ORG.NAM       0.96      0.97      0.96       182
     ORG.NOM       0.90      0.83      0.86        42
     PER.NAM       0.90      0.94      0.92       577
     PER.NOM       0.95      0.97      0.96       769

   micro avg       0.93      0.96      0.94      1889
   macro avg       0.92      0.93      0.92      1889
weighted avg       0.93      0.96      0.94      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.42it/s, F1=0.647, eval_acc=0.963, eval_loss=9.13, eval_precision=0.569, eval_recall=0.757]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       0.25      1.00      0.40         1
     LOC.NAM       0.19      0.83      0.30         6
     LOC.NOM       0.09      0.33      0.14         6
     ORG.NAM       0.32      0.40      0.36        47
     ORG.NOM       0.21      0.80      0.33         5
     PER.NAM       0.70      0.79      0.74        90
     PER.NOM       0.76      0.82      0.79       208

   micro avg       0.60      0.76      0.67       389
   macro avg       0.39      0.72      0.47       389
weighted avg       0.65      0.76      0.69       389



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.17it/s, F1=0.944, train_acc=0.997, train_loss=0.462, train_precision=0.938, train_recall=0.953]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      1.00      0.97        56
     LOC.NOM       0.85      0.92      0.89        51
     ORG.NAM       0.95      0.97      0.96       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.94      0.96      0.95       577
     PER.NOM       0.96      0.98      0.97       769

   micro avg       0.95      0.97      0.96      1889
   macro avg       0.92      0.95      0.94      1889
weighted avg       0.95      0.97      0.96      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.26it/s, F1=0.715, eval_acc=0.969, eval_loss=8.36, eval_precision=0.688, eval_recall=0.748]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.60      0.81      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.43      0.45      0.44        47
     ORG.NOM       0.44      0.80      0.57         5
     PER.NAM       0.70      0.73      0.72        90
     PER.NOM       0.77      0.75      0.76       208

   micro avg       0.68      0.70      0.69       389
   macro avg       0.57      0.67      0.61       389
weighted avg       0.68      0.70      0.69       389



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.972, train_acc=0.998, train_loss=0.289, train_precision=0.973, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.93      0.94        56
     LOC.NOM       0.89      0.96      0.92        51
     ORG.NAM       0.97      0.99      0.98       182
     ORG.NOM       0.90      0.88      0.89        42
     PER.NAM       0.98      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.94      0.96      0.95      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.22it/s, F1=0.697, eval_acc=0.967, eval_loss=9.4, eval_precision=0.64, eval_recall=0.772] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.61      0.85      0.71        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.39      0.47      0.43        47
     ORG.NOM       0.19      0.60      0.29         5
     PER.NAM       0.75      0.80      0.77        90
     PER.NOM       0.75      0.80      0.78       208

   micro avg       0.65      0.75      0.70       389
   macro avg       0.52      0.67      0.57       389
weighted avg       0.68      0.75      0.71       389



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:56<00:00,  3.02it/s, F1=0.975, train_acc=0.998, train_loss=0.279, train_precision=0.973, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.91      0.93      0.92        56
     LOC.NOM       0.94      0.98      0.96        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.95      0.93      0.94        42
     PER.NAM       0.96      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.96      0.96      0.96      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.33it/s, F1=0.68, eval_acc=0.967, eval_loss=9.9, eval_precision=0.638, eval_recall=0.736]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.55      0.85      0.67        26
     GPE.NOM       0.33      1.00      0.50         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.12      0.17      0.14         6
     ORG.NAM       0.40      0.40      0.40        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.79      0.78      0.78        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.67      0.73      0.70       389
   macro avg       0.46      0.70      0.53       389
weighted avg       0.70      0.73      0.71       389



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.965, train_acc=0.997, train_loss=0.274, train_precision=0.957, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      1.00       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.96      0.96        56
     LOC.NOM       0.96      1.00      0.98        51
     ORG.NAM       0.98      0.99      0.99       182
     ORG.NOM       0.90      0.90      0.90        42
     PER.NAM       0.95      0.97      0.96       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.96      0.98      0.97      1889
   macro avg       0.95      0.98      0.96      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.29it/s, F1=0.662, eval_acc=0.967, eval_loss=10.2, eval_precision=0.612, eval_recall=0.73] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.54      0.81      0.65        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.35      0.38      0.37        47
     ORG.NOM       0.19      0.80      0.31         5
     PER.NAM       0.73      0.77      0.75        90
     PER.NOM       0.77      0.79      0.78       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.51      0.67      0.56       389
weighted avg       0.67      0.72      0.69       389



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.17it/s, F1=0.971, train_acc=0.998, train_loss=0.265, train_precision=0.972, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.93      0.96      0.95        56
     LOC.NOM       0.98      0.96      0.97        51
     ORG.NAM       0.97      0.97      0.97       182
     ORG.NOM       0.88      0.90      0.89        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.96      0.95      0.96      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.14it/s, F1=0.664, eval_acc=0.966, eval_loss=10.3, eval_precision=0.605, eval_recall=0.744]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.68      0.81      0.74        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.31      0.83      0.45         6
     LOC.NOM       0.07      0.17      0.10         6
     ORG.NAM       0.34      0.43      0.38        47
     ORG.NOM       0.23      0.60      0.33         5
     PER.NAM       0.70      0.81      0.75        90
     PER.NOM       0.76      0.78      0.77       208

   micro avg       0.63      0.74      0.68       389
   macro avg       0.51      0.68      0.57       389
weighted avg       0.67      0.74      0.70       389



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:56<00:00,  2.99it/s, F1=0.964, train_acc=0.997, train_loss=0.308, train_precision=0.964, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       1.00      0.88      0.93         8
     LOC.NAM       0.96      0.95      0.95        56
     LOC.NOM       0.94      0.96      0.95        51
     ORG.NAM       0.96      0.97      0.96       182
     ORG.NOM       0.84      0.88      0.86        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.97      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.26it/s, F1=0.673, eval_acc=0.966, eval_loss=9.4, eval_precision=0.63, eval_recall=0.732]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.62      0.81      0.70        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.43      0.40      0.42        47
     ORG.NOM       0.22      0.80      0.35         5
     PER.NAM       0.74      0.76      0.75        90
     PER.NOM       0.73      0.79      0.76       208

   micro avg       0.66      0.72      0.69       389
   macro avg       0.55      0.67      0.59       389
weighted avg       0.67      0.72      0.69       389



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.972, train_acc=0.997, train_loss=0.259, train_precision=0.972, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.95      0.95      0.95        56
     LOC.NOM       0.96      1.00      0.98        51
     ORG.NAM       0.96      0.98      0.97       182
     ORG.NOM       0.95      0.90      0.93        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.95      0.97      0.96      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.36it/s, F1=0.668, eval_acc=0.963, eval_loss=9.43, eval_precision=0.621, eval_recall=0.73] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.56      0.85      0.68        26
     GPE.NOM       0.00      0.00      0.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.41      0.40      0.41        47
     ORG.NOM       0.20      0.80      0.32         5
     PER.NAM       0.70      0.78      0.74        90
     PER.NOM       0.75      0.77      0.76       208

   micro avg       0.64      0.72      0.68       389
   macro avg       0.39      0.55      0.44       389
weighted avg       0.66      0.72      0.69       389



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:55<00:00,  3.03it/s, F1=0.962, train_acc=0.997, train_loss=0.256, train_precision=0.959, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       1.00      1.00      1.00       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       0.93      0.96      0.95        56
     LOC.NOM       0.92      0.96      0.94        51
     ORG.NAM       0.97      0.98      0.97       182
     ORG.NOM       0.95      0.90      0.93        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.97      0.98      0.97       769

   micro avg       0.97      0.97      0.97      1889
   macro avg       0.95      0.95      0.95      1889
weighted avg       0.97      0.97      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.672, eval_acc=0.964, eval_loss=9.89, eval_precision=0.635, eval_recall=0.718]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.58      0.85      0.69        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.62      0.83      0.71         6
     LOC.NOM       0.00      0.00      0.00         6
     ORG.NAM       0.40      0.34      0.37        47
     ORG.NOM       0.21      0.60      0.32         5
     PER.NAM       0.63      0.80      0.71        90
     PER.NOM       0.77      0.75      0.76       208

   micro avg       0.65      0.71      0.68       389
   macro avg       0.53      0.65      0.57       389
weighted avg       0.66      0.71      0.68       389



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.974, train_acc=0.998, train_loss=0.274, train_precision=0.971, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.99      1.00      0.99       204
     GPE.NOM       0.89      1.00      0.94         8
     LOC.NAM       0.88      0.93      0.90        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.97      0.98      0.98       182
     ORG.NOM       0.91      0.93      0.92        42
     PER.NAM       0.97      0.98      0.97       577
     PER.NOM       0.98      0.99      0.98       769

   micro avg       0.97      0.98      0.98      1889
   macro avg       0.94      0.97      0.96      1889
weighted avg       0.97      0.98      0.98      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.35it/s, F1=0.676, eval_acc=0.965, eval_loss=8.54, eval_precision=0.626, eval_recall=0.738]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

     GPE.NAM       0.57      0.81      0.67        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.50      0.83      0.62         6
     LOC.NOM       0.10      0.17      0.12         6
     ORG.NAM       0.39      0.38      0.39        47
     ORG.NOM       0.27      0.60      0.37         5
     PER.NAM       0.65      0.81      0.72        90
     PER.NOM       0.78      0.78      0.78       208

   micro avg       0.65      0.73      0.69       389
   macro avg       0.53      0.67      0.58       389
weighted avg       0.67      0.73      0.69       389



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.14it/s, F1=0.969, train_acc=0.998, train_loss=0.329, train_precision=0.972, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.98      1.00      0.99       204
     GPE.NOM       0.88      0.88      0.88         8
     LOC.NAM       1.00      0.96      0.98        56
     LOC.NOM       0.96      0.96      0.96        51
     ORG.NAM       0.97      0.98      0.97       182
     ORG.NOM       0.93      0.93      0.93        42
     PER.NAM       0.97      0.97      0.97       577
     PER.NOM       0.98      0.98      0.98       769

   micro avg       0.97      0.98      0.97      1889
   macro avg       0.96      0.96      0.96      1889
weighted avg       0.97      0.98      0.97      1889



Eval Result: 100%|██████████| 5/5 [00:01<00:00,  4.28it/s, F1=0.685, eval_acc=0.966, eval_loss=8.41, eval_precision=0.663, eval_recall=0.716]


eval_reports:
              precision    recall  f1-score   support

     GPE.NAM       0.67      0.85      0.75        26
     GPE.NOM       1.00      1.00      1.00         1
     LOC.NAM       0.33      0.83      0.48         6
     LOC.NOM       0.14      0.17      0.15         6
     ORG.NAM       0.43      0.40      0.42        47
     ORG.NOM       0.40      0.80      0.53         5
     PER.NAM       0.75      0.80      0.77        90
     PER.NOM       0.82      0.76      0.79       208

   micro avg       0.71      0.72      0.72       389
   macro avg       0.57      0.70      0.61       389
weighted avg       0.72      0.72      0.72       389



calculate data/few_shot/note4/train_250.json etag: 100%|██████████| 98.0k/98.0k [00:00<00:00, 7.15MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 63.0MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 311MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 10.9kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_250.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_250_x1"
}
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 152083.54L/s]
build line mapper: 19L [00:00, 138835.85L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5437.48it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 193583.26it/s]

load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding



load dataset from data/few_shot/note4/train_250.json: 250it [00:00, 839.06it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 573.94it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model 

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.64it/s, F1=0, train_acc=0.394, train_loss=40.3, train_precision=0, train_recall=0]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0, eval_acc=0.895, eval_loss=29.9, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=0, train_acc=0.911, train_loss=16.8, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0, eval_acc=0.895, eval_loss=24.3, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.82it/s, F1=0, train_acc=0.902, train_loss=12.7, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.000474, eval_acc=0.895, eval_loss=16.7, eval_precision=0.00153, eval_recall=0.000288]
  _warn_prf(average, modifier, msg_start, len(result))


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.01      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650
           _       0.00      0.00      0.00         0

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.00942, train_acc=0.927, train_loss=8.09, train_precision=0.00758, train_recall=0.013]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.02      0.02      0.02        92
         LOC       0.00      0.00      0.00        16
         ORG       0.02      0.02      0.02        57
         PER       0.02      0.03      0.03        64
           _       0.00      0.00      0.00         0

   micro avg       0.02      0.02      0.02       229
   macro avg       0.01      0.01      0.01       229
weighted avg       0.02      0.02      0.02       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.0514, eval_acc=0.921, eval_loss=11.1, eval_precision=0.0581, eval_recall=0.0472]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.02      0.02      0.02      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.16      0.07      0.10      1645
         PER       0.08      0.10      0.09      1650

   micro avg       0.06      0.05      0.05      6937
   macro avg       0.07      0.05      0.05      6937
weighted avg       0.07      0.05      0.05      6937



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=0.34, train_acc=0.957, train_loss=4.52, train_precision=0.319, train_recall=0.381]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.24      0.36      0.29        92
         LOC       0.00      0.00      0.00        16
         ORG       0.48      0.54      0.51        57
         PER       0.41      0.48      0.44        64

   micro avg       0.34      0.41      0.38       229
   macro avg       0.28      0.35      0.31       229
weighted avg       0.33      0.41      0.37       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.602, eval_acc=0.95, eval_loss=8.25, eval_precision=0.527, eval_recall=0.716] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.50      0.85      0.63      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.36      0.49      0.41      1645
         PER       0.78      0.88      0.82      1650

   micro avg       0.52      0.71      0.60      6937
   macro avg       0.41      0.55      0.47      6937
weighted avg       0.50      0.71      0.58      6937



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.70it/s, F1=0.77, train_acc=0.98, train_loss=2.44, train_precision=0.755, train_recall=0.799]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.70      0.85      0.77        92
         LOC       0.00      0.00      0.00        16
         ORG       0.81      0.84      0.83        57
         PER       0.81      0.91      0.85        64

   micro avg       0.72      0.80      0.76       229
   macro avg       0.58      0.65      0.61       229
weighted avg       0.71      0.80      0.75       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.62, eval_acc=0.956, eval_loss=7.06, eval_precision=0.595, eval_recall=0.658] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.69      0.66      3160
         LOC       0.02      0.02      0.02       482
         ORG       0.47      0.51      0.49      1645
         PER       0.71      0.91      0.80      1650

   micro avg       0.59      0.65      0.62      6937
   macro avg       0.46      0.53      0.49      6937
weighted avg       0.57      0.65      0.61      6937



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.781, train_acc=0.985, train_loss=1.91, train_precision=0.741, train_recall=0.839]


train_reports:
              precision    recall  f1-score   support

         GPE       0.79      0.91      0.85        92
         LOC       0.05      0.06      0.05        16
         ORG       0.90      0.96      0.93        57
         PER       0.78      0.89      0.83        64

   micro avg       0.75      0.86      0.80       229
   macro avg       0.63      0.71      0.67       229
weighted avg       0.76      0.86      0.81       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.668, eval_acc=0.959, eval_loss=6.57, eval_precision=0.678, eval_recall=0.671]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.75      0.70      3160
         LOC       0.05      0.02      0.03       482
         ORG       0.56      0.48      0.52      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.67      0.66      0.67      6937
   macro avg       0.53      0.53      0.53      6937
weighted avg       0.64      0.66      0.65      6937



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.825, train_acc=0.992, train_loss=0.898, train_precision=0.823, train_recall=0.849]


train_reports:
              precision    recall  f1-score   support

         GPE       0.89      0.90      0.90        92
         LOC       0.25      0.25      0.25        16
         ORG       0.90      0.95      0.92        57
         PER       0.95      0.97      0.96        64

   micro avg       0.87      0.89      0.88       229
   macro avg       0.75      0.77      0.76       229
weighted avg       0.87      0.89      0.88       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.18it/s, F1=0.686, eval_acc=0.963, eval_loss=6.48, eval_precision=0.672, eval_recall=0.711]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.74      0.72      3160
         LOC       0.16      0.14      0.15       482
         ORG       0.55      0.63      0.59      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.67      0.71      0.69      6937
   macro avg       0.57      0.60      0.58      6937
weighted avg       0.66      0.71      0.68      6937



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.66it/s, F1=0.901, train_acc=0.997, train_loss=0.359, train_precision=0.898, train_recall=0.906]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98        92
         LOC       0.56      0.62      0.59        16
         ORG       0.98      1.00      0.99        57
         PER       1.00      0.95      0.98        64

   micro avg       0.95      0.96      0.95       229
   macro avg       0.88      0.89      0.88       229
weighted avg       0.95      0.96      0.95       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.681, eval_acc=0.961, eval_loss=6.93, eval_precision=0.648, eval_recall=0.728]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.75      0.73      3160
         LOC       0.17      0.34      0.22       482
         ORG       0.58      0.59      0.58      1645
         PER       0.86      0.91      0.89      1650

   micro avg       0.64      0.72      0.68      6937
   macro avg       0.58      0.65      0.61      6937
weighted avg       0.67      0.72      0.70      6937



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.68it/s, F1=0.965, train_acc=1, train_loss=0.187, train_precision=0.969, train_recall=0.961]    


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.97      0.98        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      0.98      0.99        64

   micro avg       1.00      0.98      0.99       229
   macro avg       1.00      0.99      0.99       229
weighted avg       1.00      0.98      0.99       229



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.40it/s, F1=0.71, eval_acc=0.964, eval_loss=6.92, eval_precision=0.674, eval_recall=0.761] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.80      0.75      3160
         LOC       0.21      0.32      0.25       482
         ORG       0.58      0.65      0.61      1645
         PER       0.88      0.91      0.90      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.59      0.67      0.63      6937
weighted avg       0.68      0.76      0.72      6937



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=1, train_acc=1, train_loss=0.105, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.722, eval_acc=0.964, eval_loss=7.23, eval_precision=0.687, eval_recall=0.771]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.81      0.76      3160
         LOC       0.27      0.34      0.30       482
         ORG       0.57      0.67      0.62      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.77      0.72      6937
   macro avg       0.61      0.68      0.64      6937
weighted avg       0.69      0.77      0.73      6937



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=1, train_acc=1, train_loss=0.0648, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.715, eval_acc=0.964, eval_loss=7.46, eval_precision=0.678, eval_recall=0.767]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.81      0.75      3160
         LOC       0.27      0.37      0.31       482
         ORG       0.58      0.65      0.61      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.67      0.77      0.72      6937
   macro avg       0.61      0.69      0.64      6937
weighted avg       0.68      0.77      0.72      6937



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.77it/s, F1=0.969, train_acc=1, train_loss=0.0533, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.722, eval_acc=0.964, eval_loss=7.63, eval_precision=0.681, eval_recall=0.782]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.84      0.76      3160
         LOC       0.29      0.37      0.32       482
         ORG       0.57      0.65      0.61      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.67      0.78      0.72      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.68      0.78      0.73      6937



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=0.938, train_acc=1, train_loss=0.0402, train_precision=0.938, train_recall=0.938]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.72, eval_acc=0.964, eval_loss=7.92, eval_precision=0.683, eval_recall=0.772] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.83      0.76      3160
         LOC       0.30      0.38      0.33       482
         ORG       0.56      0.62      0.59      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.77      0.72      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.68      0.77      0.72      6937



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=1, train_acc=1, train_loss=0.0314, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.44it/s, F1=0.721, eval_acc=0.964, eval_loss=8.02, eval_precision=0.686, eval_recall=0.772]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.83      0.76      3160
         LOC       0.29      0.38      0.33       482
         ORG       0.57      0.62      0.60      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.77      0.72      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.69      0.77      0.73      6937



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=1, train_acc=1, train_loss=0.0273, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.726, eval_acc=0.965, eval_loss=8.07, eval_precision=0.688, eval_recall=0.781]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.84      0.77      3160
         LOC       0.30      0.39      0.34       482
         ORG       0.57      0.64      0.60      1645
         PER       0.88      0.93      0.90      1650

   micro avg       0.68      0.78      0.73      6937
   macro avg       0.62      0.70      0.65      6937
weighted avg       0.69      0.78      0.73      6937



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.60it/s, F1=1, train_acc=1, train_loss=0.0225, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.724, eval_acc=0.964, eval_loss=8.3, eval_precision=0.686, eval_recall=0.778] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.84      0.77      3160
         LOC       0.30      0.38      0.33       482
         ORG       0.57      0.63      0.60      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.78      0.73      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.69      0.78      0.73      6937



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.969, train_acc=1, train_loss=0.0212, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.724, eval_acc=0.964, eval_loss=8.46, eval_precision=0.685, eval_recall=0.778]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.84      0.77      3160
         LOC       0.30      0.37      0.33       482
         ORG       0.56      0.63      0.60      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.78      0.73      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.69      0.78      0.73      6937



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.67it/s, F1=0.938, train_acc=1, train_loss=0.018, train_precision=0.938, train_recall=0.938] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.728, eval_acc=0.965, eval_loss=8.52, eval_precision=0.693, eval_recall=0.777]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.83      0.77      3160
         LOC       0.31      0.37      0.34       482
         ORG       0.57      0.64      0.61      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.69      0.78      0.73      6937
   macro avg       0.62      0.69      0.65      6937
weighted avg       0.69      0.78      0.73      6937



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=1, train_acc=1, train_loss=0.0222, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.39it/s, F1=0.72, eval_acc=0.963, eval_loss=8.69, eval_precision=0.667, eval_recall=0.796] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.86      0.75      3160
         LOC       0.29      0.39      0.33       482
         ORG       0.56      0.65      0.60      1645
         PER       0.88      0.93      0.90      1650

   micro avg       0.66      0.80      0.72      6937
   macro avg       0.60      0.71      0.65      6937
weighted avg       0.67      0.80      0.72      6937



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.66it/s, F1=0.999, train_acc=1, train_loss=0.037, train_precision=0.998, train_recall=1]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.721, eval_acc=0.964, eval_loss=8.61, eval_precision=0.686, eval_recall=0.773]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.82      0.76      3160
         LOC       0.30      0.38      0.33       482
         ORG       0.57      0.63      0.60      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.77      0.72      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.69      0.77      0.73      6937



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.75it/s, F1=0.999, train_acc=1, train_loss=0.0254, train_precision=0.998, train_recall=1]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.723, eval_acc=0.964, eval_loss=8.45, eval_precision=0.691, eval_recall=0.77] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.80      0.77      3160
         LOC       0.29      0.39      0.33       482
         ORG       0.56      0.67      0.61      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.69      0.77      0.73      6937
   macro avg       0.62      0.69      0.65      6937
weighted avg       0.70      0.77      0.73      6937



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.70it/s, F1=0.969, train_acc=1, train_loss=0.0135, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.726, eval_acc=0.964, eval_loss=8.53, eval_precision=0.685, eval_recall=0.784]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.82      0.77      3160
         LOC       0.31      0.39      0.34       482
         ORG       0.55      0.68      0.61      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.68      0.78      0.73      6937
   macro avg       0.62      0.70      0.66      6937
weighted avg       0.69      0.78      0.73      6937



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.65it/s, F1=0.969, train_acc=1, train_loss=0.0117, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.729, eval_acc=0.965, eval_loss=8.61, eval_precision=0.688, eval_recall=0.789]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.82      0.77      3160
         LOC       0.32      0.39      0.35       482
         ORG       0.56      0.70      0.62      1645
         PER       0.89      0.92      0.90      1650

   micro avg       0.68      0.79      0.73      6937
   macro avg       0.62      0.71      0.66      6937
weighted avg       0.69      0.79      0.74      6937



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.80it/s, F1=0.938, train_acc=1, train_loss=0.0113, train_precision=0.938, train_recall=0.938]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.44it/s, F1=0.728, eval_acc=0.965, eval_loss=8.71, eval_precision=0.69, eval_recall=0.782] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.81      0.76      3160
         LOC       0.32      0.39      0.35       482
         ORG       0.57      0.69      0.62      1645
         PER       0.89      0.92      0.90      1650

   micro avg       0.69      0.78      0.73      6937
   macro avg       0.62      0.70      0.66      6937
weighted avg       0.70      0.78      0.74      6937



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.68it/s, F1=0.906, train_acc=1, train_loss=0.00889, train_precision=0.906, train_recall=0.906]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.728, eval_acc=0.965, eval_loss=8.79, eval_precision=0.69, eval_recall=0.783] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.82      0.77      3160
         LOC       0.31      0.39      0.35       482
         ORG       0.57      0.69      0.62      1645
         PER       0.89      0.92      0.90      1650

   micro avg       0.69      0.78      0.73      6937
   macro avg       0.62      0.71      0.66      6937
weighted avg       0.70      0.78      0.74      6937



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.71it/s, F1=0.93, train_acc=0.999, train_loss=0.178, train_precision=0.93, train_recall=0.931]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       0.99      0.99      0.99       229
   macro avg       0.99      0.99      0.99       229
weighted avg       0.99      0.99      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.667, eval_acc=0.961, eval_loss=8.93, eval_precision=0.676, eval_recall=0.667]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.59      0.64      3160
         LOC       0.24      0.26      0.25       482
         ORG       0.55      0.66      0.60      1645
         PER       0.89      0.92      0.90      1650

   micro avg       0.67      0.66      0.66      6937
   macro avg       0.59      0.61      0.60      6937
weighted avg       0.67      0.66      0.66      6937



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.62it/s, F1=0.998, train_acc=1, train_loss=0.0701, train_precision=0.997, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.717, eval_acc=0.964, eval_loss=7.82, eval_precision=0.67, eval_recall=0.782] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.83      0.76      3160
         LOC       0.30      0.35      0.32       482
         ORG       0.52      0.67      0.59      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.66      0.78      0.72      6937
   macro avg       0.60      0.69      0.64      6937
weighted avg       0.67      0.78      0.72      6937



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.67it/s, F1=0.938, train_acc=1, train_loss=0.0213, train_precision=0.938, train_recall=0.938]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.71, eval_acc=0.963, eval_loss=8.6, eval_precision=0.682, eval_recall=0.751]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.80      0.76      3160
         LOC       0.27      0.41      0.32       482
         ORG       0.56      0.58      0.57      1645
         PER       0.87      0.92      0.90      1650

   micro avg       0.68      0.75      0.71      6937
   macro avg       0.61      0.68      0.64      6937
weighted avg       0.69      0.75      0.72      6937



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.69it/s, F1=0.963, train_acc=0.999, train_loss=0.189, train_precision=0.963, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      0.98      0.99        57
         PER       0.98      1.00      0.99        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.67, eval_acc=0.947, eval_loss=10.6, eval_precision=0.584, eval_recall=0.802] 


eval_reports:
              precision    recall  f1-score   support

         GPE       0.69      0.81      0.75      3160
         LOC       0.36      0.38      0.37       482
         ORG       0.35      0.74      0.48      1645
         PER       0.91      0.92      0.91      1650

   micro avg       0.59      0.79      0.67      6937
   macro avg       0.58      0.71      0.63      6937
weighted avg       0.64      0.79      0.70      6937



calculate data/few_shot/note4/train_250.json etag: 100%|██████████| 98.0k/98.0k [00:00<00:00, 137MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 316MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 367MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 202kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_250.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_250_x2"
}
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 167772.16L/s]
build line mapper: 19L [00:00, 41527.76L/s]9 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5743.14it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 206277.25it/s]
load dataset from data/few_shot/note4/train_250.json: 0it [00:00, ?it/s]

load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_250.json: 250it [00:00, 829.01it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 563.50it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model f

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.62it/s, F1=0, train_acc=0.0956, train_loss=102, train_precision=0, train_recall=0]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0, eval_acc=0.893, eval_loss=52, eval_precision=0, eval_recall=0]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.69it/s, F1=0, train_acc=0.911, train_loss=21.3, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0, eval_acc=0.895, eval_loss=30.3, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.71it/s, F1=0, train_acc=0.911, train_loss=16.9, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.18it/s, F1=0, eval_acc=0.895, eval_loss=25, eval_precision=0, eval_recall=0]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.63it/s, F1=0.007, train_acc=0.91, train_loss=12.4, train_precision=0.00631, train_recall=0.00837]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.04      0.03      0.04        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64
           _       0.00      0.00      0.00         0

   micro avg       0.02      0.01      0.01       229
   macro avg       0.01      0.01      0.01       229
weighted avg       0.02      0.01      0.01       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.011, eval_acc=0.903, eval_loss=18.1, eval_precision=0.00776, eval_recall=0.0193]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.02      0.03      0.02      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.02      0.01      1645
         PER       0.01      0.01      0.01      1650
           _       0.00      0.00      0.00         0

   micro avg       0.01      0.02      0.01      6937
   macro avg       0.01      0.01      0.01      6937
weighted avg       0.01      0.02      0.01      6937



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.82it/s, F1=0.183, train_acc=0.942, train_loss=7.54, train_precision=0.174, train_recall=0.222]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.18      0.35      0.23        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.13      0.25      0.17        64
           _       0.00      0.00      0.00         0

   micro avg       0.11      0.21      0.14       229
   macro avg       0.06      0.12      0.08       229
weighted avg       0.11      0.21      0.14       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.347, eval_acc=0.939, eval_loss=12.2, eval_precision=0.276, eval_recall=0.482]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.32      0.63      0.43      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.01      0.02      0.01      1645
         PER       0.66      0.75      0.70      1650
           _       0.00      0.00      0.00         0

   micro avg       0.26      0.47      0.33      6937
   macro avg       0.20      0.28      0.23      6937
weighted avg       0.31      0.47      0.36      6937



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.325, train_acc=0.966, train_loss=4.42, train_precision=0.289, train_recall=0.392]


train_reports:
              precision    recall  f1-score   support

         GPE       0.28      0.52      0.37        92
         LOC       0.00      0.00      0.00        16
         ORG       0.04      0.09      0.06        57
         PER       0.58      0.67      0.62        64
           _       0.00      0.00      0.00         0

   micro avg       0.25      0.42      0.31       229
   macro avg       0.18      0.26      0.21       229
weighted avg       0.29      0.42      0.34       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.438, eval_acc=0.942, eval_loss=11.2, eval_precision=0.368, eval_recall=0.552]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.39      0.71      0.50      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.02      0.02      0.02      1645
         PER       0.71      0.89      0.79      1650
           _       0.00      0.00      0.00         0

   micro avg       0.36      0.54      0.43      6937
   macro avg       0.22      0.32      0.26      6937
weighted avg       0.35      0.54      0.42      6937



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.70it/s, F1=0.551, train_acc=0.975, train_loss=2.82, train_precision=0.507, train_recall=0.63] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.46      0.67      0.55        92
         LOC       0.00      0.00      0.00        16
         ORG       0.35      0.56      0.43        57
         PER       0.66      0.83      0.74        64
           _       0.00      0.00      0.00         0

   micro avg       0.47      0.64      0.54       229
   macro avg       0.29      0.41      0.34       229
weighted avg       0.46      0.64      0.53       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.525, eval_acc=0.952, eval_loss=9.71, eval_precision=0.461, eval_recall=0.62] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.47      0.74      0.58      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.20      0.29      0.23      1645
         PER       0.80      0.86      0.83      1650
           _       0.00      0.00      0.00         0

   micro avg       0.45      0.61      0.52      6937
   macro avg       0.29      0.38      0.33      6937
weighted avg       0.45      0.61      0.52      6937



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.77it/s, F1=0.747, train_acc=0.986, train_loss=2.05, train_precision=0.707, train_recall=0.804]


train_reports:
              precision    recall  f1-score   support

         GPE       0.61      0.80      0.69        92
         LOC       0.05      0.06      0.06        16
         ORG       0.68      0.81      0.74        57
         PER       0.86      0.92      0.89        64

   micro avg       0.65      0.79      0.71       229
   macro avg       0.55      0.65      0.59       229
weighted avg       0.65      0.79      0.71       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.568, eval_acc=0.952, eval_loss=9.36, eval_precision=0.505, eval_recall=0.663]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.56      0.65      0.60      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.28      0.57      0.37      1645
         PER       0.81      0.90      0.85      1650
           _       0.00      0.00      0.00         0

   micro avg       0.49      0.65      0.56      6937
   macro avg       0.33      0.42      0.37      6937
weighted avg       0.52      0.65      0.57      6937



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.821, train_acc=0.992, train_loss=1.01, train_precision=0.809, train_recall=0.839] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.80      0.89      0.84        92
         LOC       0.11      0.12      0.11        16
         ORG       0.84      0.95      0.89        57
         PER       0.98      0.94      0.96        64

   micro avg       0.80      0.86      0.83       229
   macro avg       0.68      0.73      0.70       229
weighted avg       0.81      0.86      0.84       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.608, eval_acc=0.954, eval_loss=9.24, eval_precision=0.542, eval_recall=0.704]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.64      0.64      3160
         LOC       0.18      0.27      0.21       482
         ORG       0.35      0.67      0.46      1645
         PER       0.78      0.92      0.84      1650

   micro avg       0.53      0.69      0.60      6937
   macro avg       0.49      0.63      0.54      6937
weighted avg       0.57      0.69      0.62      6937



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.72it/s, F1=0.908, train_acc=0.995, train_loss=0.665, train_precision=0.907, train_recall=0.916]


train_reports:
              precision    recall  f1-score   support

         GPE       0.91      0.91      0.91        92
         LOC       0.87      0.81      0.84        16
         ORG       0.87      0.91      0.89        57
         PER       0.97      0.98      0.98        64

   micro avg       0.91      0.93      0.92       229
   macro avg       0.90      0.91      0.90       229
weighted avg       0.91      0.93      0.92       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.591, eval_acc=0.954, eval_loss=9.89, eval_precision=0.527, eval_recall=0.687]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.57      0.73      0.64      3160
         LOC       0.12      0.28      0.16       482
         ORG       0.38      0.52      0.44      1645
         PER       0.83      0.85      0.84      1650

   micro avg       0.51      0.68      0.58      6937
   macro avg       0.47      0.60      0.52      6937
weighted avg       0.55      0.68      0.60      6937



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.68it/s, F1=0.928, train_acc=0.998, train_loss=0.437, train_precision=0.918, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.96      0.96        92
         LOC       0.65      0.81      0.72        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       0.95      0.97      0.96       229
   macro avg       0.90      0.94      0.92       229
weighted avg       0.96      0.97      0.96       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.04it/s, F1=0.635, eval_acc=0.958, eval_loss=9.56, eval_precision=0.591, eval_recall=0.696]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.67      0.66      3160
         LOC       0.24      0.24      0.24       482
         ORG       0.43      0.66      0.52      1645
         PER       0.77      0.89      0.82      1650

   micro avg       0.59      0.69      0.63      6937
   macro avg       0.52      0.61      0.56      6937
weighted avg       0.60      0.69      0.64      6937



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.71it/s, F1=0.946, train_acc=0.999, train_loss=0.251, train_precision=0.958, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.97      0.97        92
         LOC       0.94      1.00      0.97        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       0.98      0.99      0.98       229
   macro avg       0.98      0.99      0.98       229
weighted avg       0.98      0.99      0.98       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.42it/s, F1=0.621, eval_acc=0.957, eval_loss=10.3, eval_precision=0.592, eval_recall=0.666]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.61      0.63      3160
         LOC       0.19      0.26      0.22       482
         ORG       0.44      0.64      0.52      1645
         PER       0.78      0.89      0.83      1650

   micro avg       0.58      0.66      0.62      6937
   macro avg       0.52      0.60      0.55      6937
weighted avg       0.61      0.66      0.62      6937



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.70it/s, F1=0.938, train_acc=0.998, train_loss=0.372, train_precision=0.941, train_recall=0.939]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.96      0.96        92
         LOC       1.00      1.00      1.00        16
         ORG       0.97      1.00      0.98        57
         PER       0.97      0.98      0.98        64

   micro avg       0.97      0.98      0.97       229
   macro avg       0.98      0.99      0.98       229
weighted avg       0.97      0.98      0.97       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.646, eval_acc=0.959, eval_loss=9.86, eval_precision=0.58, eval_recall=0.744] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.60      0.80      0.69      3160
         LOC       0.22      0.32      0.26       482
         ORG       0.42      0.57      0.49      1645
         PER       0.82      0.90      0.86      1650

   micro avg       0.57      0.74      0.64      6937
   macro avg       0.52      0.65      0.57      6937
weighted avg       0.58      0.74      0.65      6937



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.77it/s, F1=0.891, train_acc=0.998, train_loss=0.33, train_precision=0.882, train_recall=0.903] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.98      0.99        92
         LOC       0.94      0.94      0.94        16
         ORG       0.89      0.95      0.92        57
         PER       0.97      1.00      0.98        64

   micro avg       0.96      0.97      0.97       229
   macro avg       0.95      0.97      0.96       229
weighted avg       0.96      0.97      0.97       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.613, eval_acc=0.952, eval_loss=14.1, eval_precision=0.609, eval_recall=0.628]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.73      0.69      3160
         LOC       0.21      0.29      0.24       482
         ORG       0.36      0.29      0.32      1645
         PER       0.81      0.87      0.84      1650

   micro avg       0.60      0.63      0.62      6937
   macro avg       0.51      0.54      0.53      6937
weighted avg       0.60      0.63      0.61      6937



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=0.916, train_acc=0.997, train_loss=0.591, train_precision=0.91, train_recall=0.931] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       0.87      0.81      0.84        16
         ORG       0.81      0.91      0.86        57
         PER       1.00      1.00      1.00        64

   micro avg       0.94      0.97      0.95       229
   macro avg       0.92      0.93      0.92       229
weighted avg       0.94      0.97      0.95       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.655, eval_acc=0.959, eval_loss=11.1, eval_precision=0.599, eval_recall=0.735]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.78      0.69      3160
         LOC       0.23      0.34      0.27       482
         ORG       0.45      0.59      0.51      1645
         PER       0.85      0.90      0.87      1650

   micro avg       0.59      0.73      0.65      6937
   macro avg       0.54      0.65      0.59      6937
weighted avg       0.61      0.73      0.66      6937



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.60it/s, F1=0.954, train_acc=0.992, train_loss=2.1, train_precision=0.96, train_recall=0.965]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99        92
         LOC       0.88      0.88      0.88        16
         ORG       0.90      0.95      0.92        57
         PER       0.98      0.98      0.98        64

   micro avg       0.96      0.97      0.96       229
   macro avg       0.94      0.95      0.94       229
weighted avg       0.96      0.97      0.96       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.637, eval_acc=0.957, eval_loss=11.4, eval_precision=0.602, eval_recall=0.687]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.76      0.70      3160
         LOC       0.24      0.37      0.29       482
         ORG       0.41      0.42      0.41      1645
         PER       0.82      0.90      0.86      1650

   micro avg       0.60      0.69      0.64      6937
   macro avg       0.53      0.61      0.57      6937
weighted avg       0.60      0.69      0.64      6937



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.65it/s, F1=0.95, train_acc=0.999, train_loss=0.334, train_precision=0.946, train_recall=0.954] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       0.90      0.95      0.92        57
         PER       1.00      1.00      1.00        64

   micro avg       0.97      0.98      0.98       229
   macro avg       0.97      0.98      0.98       229
weighted avg       0.97      0.98      0.98       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.41it/s, F1=0.659, eval_acc=0.959, eval_loss=10, eval_precision=0.612, eval_recall=0.726]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.76      0.71      3160
         LOC       0.30      0.29      0.29       482
         ORG       0.40      0.59      0.48      1645
         PER       0.84      0.89      0.87      1650

   micro avg       0.60      0.72      0.66      6937
   macro avg       0.55      0.63      0.59      6937
weighted avg       0.62      0.72      0.66      6937



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.69it/s, F1=0.963, train_acc=1, train_loss=0.0849, train_precision=0.962, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       0.97      0.98      0.97        57
         PER       1.00      1.00      1.00        64

   micro avg       0.99      1.00      0.99       229
   macro avg       0.99      1.00      0.99       229
weighted avg       0.99      1.00      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.00it/s, F1=0.664, eval_acc=0.959, eval_loss=10.6, eval_precision=0.605, eval_recall=0.748]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.75      0.71      3160
         LOC       0.27      0.39      0.32       482
         ORG       0.41      0.65      0.50      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.60      0.74      0.66      6937
   macro avg       0.55      0.67      0.60      6937
weighted avg       0.62      0.74      0.67      6937



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.75it/s, F1=0.95, train_acc=1, train_loss=0.0711, train_precision=0.953, train_recall=0.948]     


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.98      0.98        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      0.99      0.99       229
   macro avg       1.00      0.99      1.00       229
weighted avg       1.00      0.99      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.666, eval_acc=0.959, eval_loss=10.7, eval_precision=0.606, eval_recall=0.753]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.78      0.70      3160
         LOC       0.28      0.29      0.29       482
         ORG       0.42      0.64      0.51      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.60      0.74      0.66      6937
   macro avg       0.55      0.66      0.59      6937
weighted avg       0.61      0.74      0.67      6937



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.71it/s, F1=0.994, train_acc=1, train_loss=0.0495, train_precision=0.992, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       0.94      0.94      0.94        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       0.99      1.00      0.99       229
   macro avg       0.98      0.98      0.98       229
weighted avg       0.99      1.00      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.669, eval_acc=0.959, eval_loss=10.9, eval_precision=0.609, eval_recall=0.756]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.76      0.71      3160
         LOC       0.26      0.39      0.31       482
         ORG       0.44      0.66      0.52      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.60      0.75      0.67      6937
   macro avg       0.55      0.68      0.61      6937
weighted avg       0.62      0.75      0.68      6937



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.77it/s, F1=0.938, train_acc=1, train_loss=0.0387, train_precision=0.938, train_recall=0.938]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.671, eval_acc=0.96, eval_loss=11, eval_precision=0.616, eval_recall=0.752]   


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.77      0.71      3160
         LOC       0.26      0.36      0.31       482
         ORG       0.44      0.63      0.52      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.61      0.74      0.67      6937
   macro avg       0.55      0.67      0.60      6937
weighted avg       0.62      0.74      0.68      6937



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.66it/s, F1=1, train_acc=1, train_loss=0.0283, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.43it/s, F1=0.675, eval_acc=0.96, eval_loss=11.1, eval_precision=0.625, eval_recall=0.747] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.78      0.72      3160
         LOC       0.27      0.35      0.31       482
         ORG       0.45      0.62      0.52      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.62      0.74      0.67      6937
   macro avg       0.56      0.66      0.61      6937
weighted avg       0.63      0.74      0.68      6937



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.969, train_acc=1, train_loss=0.0317, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.672, eval_acc=0.96, eval_loss=11.4, eval_precision=0.608, eval_recall=0.765] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.80      0.71      3160
         LOC       0.26      0.36      0.30       482
         ORG       0.44      0.64      0.52      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.60      0.76      0.67      6937
   macro avg       0.55      0.68      0.60      6937
weighted avg       0.62      0.76      0.68      6937



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.71it/s, F1=1, train_acc=1, train_loss=0.0223, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.675, eval_acc=0.96, eval_loss=11.5, eval_precision=0.614, eval_recall=0.762] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.79      0.71      3160
         LOC       0.27      0.36      0.31       482
         ORG       0.44      0.64      0.52      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.61      0.75      0.67      6937
   macro avg       0.55      0.68      0.61      6937
weighted avg       0.62      0.75      0.68      6937



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=1, train_acc=1, train_loss=0.0189, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.676, eval_acc=0.96, eval_loss=11.6, eval_precision=0.617, eval_recall=0.762] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.79      0.72      3160
         LOC       0.28      0.37      0.31       482
         ORG       0.45      0.64      0.53      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.61      0.75      0.67      6937
   macro avg       0.55      0.68      0.61      6937
weighted avg       0.62      0.75      0.68      6937



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=1, train_acc=1, train_loss=0.0178, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.04it/s, F1=0.677, eval_acc=0.96, eval_loss=11.7, eval_precision=0.618, eval_recall=0.762] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.79      0.72      3160
         LOC       0.28      0.36      0.32       482
         ORG       0.45      0.64      0.53      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.61      0.76      0.67      6937
   macro avg       0.56      0.68      0.61      6937
weighted avg       0.62      0.76      0.68      6937



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.938, train_acc=1, train_loss=0.0154, train_precision=0.938, train_recall=0.938]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.39it/s, F1=0.678, eval_acc=0.96, eval_loss=11.7, eval_precision=0.62, eval_recall=0.761]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.79      0.72      3160
         LOC       0.28      0.37      0.32       482
         ORG       0.45      0.64      0.53      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.61      0.75      0.67      6937
   macro avg       0.56      0.68      0.61      6937
weighted avg       0.62      0.75      0.68      6937



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.938, train_acc=1, train_loss=0.0147, train_precision=0.938, train_recall=0.938]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.679, eval_acc=0.96, eval_loss=11.8, eval_precision=0.623, eval_recall=0.759] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.79      0.72      3160
         LOC       0.28      0.36      0.32       482
         ORG       0.45      0.63      0.53      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.61      0.75      0.68      6937
   macro avg       0.56      0.67      0.61      6937
weighted avg       0.63      0.75      0.68      6937



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.65it/s, F1=1, train_acc=1, train_loss=0.0144, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.68, eval_acc=0.96, eval_loss=11.9, eval_precision=0.624, eval_recall=0.76]   


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.79      0.72      3160
         LOC       0.28      0.37      0.32       482
         ORG       0.45      0.63      0.53      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.61      0.75      0.68      6937
   macro avg       0.56      0.68      0.61      6937
weighted avg       0.63      0.75      0.68      6937



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.75it/s, F1=0.969, train_acc=1, train_loss=0.0146, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.677, eval_acc=0.96, eval_loss=12, eval_precision=0.615, eval_recall=0.766]   


eval_reports:
              precision    recall  f1-score   support

         GPE       0.65      0.80      0.72      3160
         LOC       0.27      0.36      0.31       482
         ORG       0.45      0.64      0.53      1645
         PER       0.84      0.92      0.88      1650

   micro avg       0.61      0.76      0.67      6937
   macro avg       0.55      0.68      0.61      6937
weighted avg       0.62      0.76      0.68      6937



calculate data/few_shot/note4/train_250.json etag: 100%|██████████| 98.0k/98.0k [00:00<00:00, 128MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 329MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 368MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 166kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_250.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_250_x3"
}
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 168481.56L/s]
build line mapper: 19L [00:00, 168481.56L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5705.31it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 196608.00it/s]
load dataset from data/few_shot/note4/train_250.json: 0it [00:00, ?it/s]

load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/7037c0d8b5e05990c48974ccd914b436_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_250.json: 250it [00:00, 827.24it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 571.73it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model f

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.63it/s, F1=0.000553, train_acc=0.33, train_loss=57.4, train_precision=0.000285, train_recall=0.00938]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.01      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.02      0.00        64

   micro avg       0.00      0.01      0.00       229
   macro avg       0.00      0.01      0.00       229
weighted avg       0.00      0.01      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0, eval_acc=0.895, eval_loss=30.5, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.66it/s, F1=0, train_acc=0.908, train_loss=18.4, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0, eval_acc=0.895, eval_loss=26, eval_precision=0, eval_recall=0]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.77it/s, F1=0, train_acc=0.912, train_loss=13.4, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.000151, eval_acc=0.895, eval_loss=18.8, eval_precision=0.000408, eval_recall=9.25e-5] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.64it/s, F1=0, train_acc=0.913, train_loss=9.24, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00        92
         LOC       0.00      0.00      0.00        16
         ORG       0.00      0.00      0.00        57
         PER       0.00      0.00      0.00        64

   micro avg       0.00      0.00      0.00       229
   macro avg       0.00      0.00      0.00       229
weighted avg       0.00      0.00      0.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.112, eval_acc=0.921, eval_loss=12.6, eval_precision=0.0868, eval_recall=0.163] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.15      0.24      0.18      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.01      0.00      1645
         PER       0.11      0.23      0.15      1650

   micro avg       0.09      0.17      0.12      6937
   macro avg       0.06      0.12      0.08      6937
weighted avg       0.09      0.17      0.12      6937



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.332, train_acc=0.955, train_loss=5.18, train_precision=0.308, train_recall=0.371]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.28      0.45      0.34        92
         LOC       0.00      0.00      0.00        16
         ORG       0.11      0.23      0.15        57
         PER       0.48      0.58      0.52        64

   micro avg       0.26      0.40      0.32       229
   macro avg       0.22      0.31      0.25       229
weighted avg       0.27      0.40      0.32       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.506, eval_acc=0.949, eval_loss=8.6, eval_precision=0.45, eval_recall=0.588]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.43      0.66      0.52      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.21      0.33      0.25      1645
         PER       0.82      0.84      0.83      1650

   micro avg       0.43      0.58      0.49      6937
   macro avg       0.36      0.46      0.40      6937
weighted avg       0.44      0.58      0.50      6937



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=0.64, train_acc=0.98, train_loss=2.58, train_precision=0.613, train_recall=0.685]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.45      0.66      0.54        92
         LOC       0.00      0.00      0.00        16
         ORG       0.71      0.77      0.74        57
         PER       0.89      0.88      0.88        64

   micro avg       0.59      0.70      0.64       229
   macro avg       0.51      0.58      0.54       229
weighted avg       0.61      0.70      0.65       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.45it/s, F1=0.596, eval_acc=0.955, eval_loss=8.53, eval_precision=0.576, eval_recall=0.629]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.57      0.71      0.63      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.35      0.42      0.38      1645
         PER       0.86      0.84      0.85      1650

   micro avg       0.56      0.62      0.59      6937
   macro avg       0.44      0.49      0.47      6937
weighted avg       0.55      0.62      0.58      6937



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.62it/s, F1=0.772, train_acc=0.984, train_loss=2.13, train_precision=0.746, train_recall=0.812]


train_reports:
              precision    recall  f1-score   support

         GPE       0.75      0.88      0.81        92
         LOC       0.00      0.00      0.00        16
         ORG       0.70      0.88      0.78        57
         PER       0.94      0.94      0.94        64

   micro avg       0.74      0.83      0.78       229
   macro avg       0.60      0.67      0.63       229
weighted avg       0.74      0.83      0.78       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.529, eval_acc=0.951, eval_loss=7.78, eval_precision=0.461, eval_recall=0.635]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.47      0.70      0.57      3160
         LOC       0.00      0.02      0.01       482
         ORG       0.36      0.47      0.41      1645
         PER       0.89      0.83      0.86      1650

   micro avg       0.44      0.63      0.51      6937
   macro avg       0.43      0.51      0.46      6937
weighted avg       0.51      0.63      0.56      6937



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.66it/s, F1=0.738, train_acc=0.989, train_loss=1.22, train_precision=0.727, train_recall=0.775]


train_reports:
              precision    recall  f1-score   support

         GPE       0.78      0.88      0.83        92
         LOC       0.00      0.00      0.00        16
         ORG       0.74      0.89      0.81        57
         PER       1.00      0.94      0.97        64

   micro avg       0.76      0.84      0.80       229
   macro avg       0.63      0.68      0.65       229
weighted avg       0.78      0.84      0.80       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.591, eval_acc=0.953, eval_loss=8.9, eval_precision=0.56, eval_recall=0.641]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.57      0.72      0.64      3160
         LOC       0.03      0.05      0.04       482
         ORG       0.43      0.41      0.42      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.55      0.64      0.59      6937
   macro avg       0.47      0.52      0.49      6937
weighted avg       0.57      0.64      0.60      6937



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.905, train_acc=0.997, train_loss=0.679, train_precision=0.899, train_recall=0.914]


train_reports:
              precision    recall  f1-score   support

         GPE       0.90      0.95      0.92        92
         LOC       0.38      0.50      0.43        16
         ORG       0.93      0.95      0.94        57
         PER       1.00      1.00      1.00        64

   micro avg       0.89      0.93      0.91       229
   macro avg       0.80      0.85      0.82       229
weighted avg       0.90      0.93      0.91       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.652, eval_acc=0.957, eval_loss=8.5, eval_precision=0.596, eval_recall=0.734] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.58      0.82      0.68      3160
         LOC       0.08      0.04      0.05       482
         ORG       0.43      0.57      0.49      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.58      0.73      0.65      6937
   macro avg       0.49      0.58      0.53      6937
weighted avg       0.58      0.73      0.64      6937



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.62it/s, F1=0.899, train_acc=0.997, train_loss=0.455, train_precision=0.905, train_recall=0.896]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.96      0.96        92
         LOC       0.85      0.69      0.76        16
         ORG       0.97      0.98      0.97        57
         PER       0.95      0.98      0.97        64

   micro avg       0.95      0.95      0.95       229
   macro avg       0.93      0.90      0.91       229
weighted avg       0.95      0.95      0.95       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.658, eval_acc=0.959, eval_loss=8.13, eval_precision=0.6, eval_recall=0.741]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.78      0.71      3160
         LOC       0.18      0.38      0.24       482
         ORG       0.45      0.60      0.51      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.59      0.74      0.65      6937
   macro avg       0.54      0.67      0.59      6937
weighted avg       0.62      0.74      0.67      6937



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.65it/s, F1=0.98, train_acc=0.999, train_loss=0.192, train_precision=0.982, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.95      0.96        92
         LOC       0.94      1.00      0.97        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       0.98      0.98      0.98       229
   macro avg       0.98      0.99      0.98       229
weighted avg       0.98      0.98      0.98       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.658, eval_acc=0.957, eval_loss=8.58, eval_precision=0.591, eval_recall=0.757]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.62      0.81      0.70      3160
         LOC       0.18      0.29      0.22       482
         ORG       0.43      0.62      0.51      1645
         PER       0.86      0.91      0.89      1650

   micro avg       0.58      0.75      0.65      6937
   macro avg       0.52      0.66      0.58      6937
weighted avg       0.60      0.75      0.67      6937



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.63it/s, F1=0.978, train_acc=0.998, train_loss=0.249, train_precision=0.974, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98        92
         LOC       0.83      0.94      0.88        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       0.98      0.99      0.98       229
   macro avg       0.95      0.98      0.97       229
weighted avg       0.98      0.99      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.674, eval_acc=0.96, eval_loss=9.02, eval_precision=0.635, eval_recall=0.73]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.81      0.72      3160
         LOC       0.22      0.23      0.22       482
         ORG       0.46      0.55      0.50      1645
         PER       0.88      0.89      0.89      1650

   micro avg       0.62      0.73      0.67      6937
   macro avg       0.55      0.62      0.58      6937
weighted avg       0.63      0.73      0.67      6937



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.70it/s, F1=0.969, train_acc=0.998, train_loss=0.383, train_precision=0.958, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97        92
         LOC       0.94      0.94      0.94        16
         ORG       0.97      1.00      0.98        57
         PER       0.98      0.98      0.98        64

   micro avg       0.97      0.98      0.97       229
   macro avg       0.96      0.98      0.97       229
weighted avg       0.97      0.98      0.97       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.663, eval_acc=0.959, eval_loss=8.89, eval_precision=0.627, eval_recall=0.717]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.78      0.71      3160
         LOC       0.27      0.33      0.30       482
         ORG       0.44      0.48      0.46      1645
         PER       0.84      0.92      0.88      1650

   micro avg       0.62      0.71      0.66      6937
   macro avg       0.55      0.63      0.59      6937
weighted avg       0.62      0.71      0.66      6937



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.67it/s, F1=0.92, train_acc=0.999, train_loss=0.164, train_precision=0.913, train_recall=0.929] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       0.82      0.88      0.85        16
         ORG       1.00      1.00      1.00        57
         PER       0.97      0.98      0.98        64

   micro avg       0.97      0.99      0.98       229
   macro avg       0.95      0.96      0.95       229
weighted avg       0.97      0.99      0.98       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.675, eval_acc=0.961, eval_loss=8.69, eval_precision=0.647, eval_recall=0.721]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.73      0.71      3160
         LOC       0.26      0.37      0.31       482
         ORG       0.48      0.62      0.54      1645
         PER       0.88      0.90      0.89      1650

   micro avg       0.63      0.72      0.67      6937
   macro avg       0.58      0.66      0.61      6937
weighted avg       0.65      0.72      0.68      6937



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.957, train_acc=0.999, train_loss=0.161, train_precision=0.958, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       0.97      0.97      0.97        64

   micro avg       0.99      0.99      0.99       229
   macro avg       0.99      0.99      0.99       229
weighted avg       0.99      0.99      0.99       229



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  3.98it/s, F1=0.689, eval_acc=0.961, eval_loss=8.7, eval_precision=0.653, eval_recall=0.741] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.76      0.73      3160
         LOC       0.36      0.31      0.33       482
         ORG       0.47      0.63      0.54      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.59      0.65      0.62      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.75it/s, F1=0.965, train_acc=0.999, train_loss=0.0797, train_precision=0.965, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      0.98      0.99        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.682, eval_acc=0.96, eval_loss=9.25, eval_precision=0.652, eval_recall=0.73]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.73      0.71      3160
         LOC       0.32      0.38      0.35       482
         ORG       0.48      0.62      0.54      1645
         PER       0.82      0.92      0.87      1650

   micro avg       0.64      0.72      0.68      6937
   macro avg       0.58      0.66      0.62      6937
weighted avg       0.65      0.72      0.68      6937



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.65it/s, F1=0.994, train_acc=1, train_loss=0.0604, train_precision=0.99, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       0.98      1.00      0.99        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.684, eval_acc=0.96, eval_loss=9.66, eval_precision=0.669, eval_recall=0.713] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.71      0.70      3160
         LOC       0.33      0.36      0.35       482
         ORG       0.50      0.59      0.54      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.66      0.71      0.68      6937
   macro avg       0.60      0.64      0.62      6937
weighted avg       0.66      0.71      0.68      6937



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.906, train_acc=1, train_loss=0.03, train_precision=0.906, train_recall=0.906]  


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.688, eval_acc=0.96, eval_loss=9.79, eval_precision=0.672, eval_recall=0.719] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.74      0.72      3160
         LOC       0.34      0.37      0.35       482
         ORG       0.51      0.59      0.54      1645
         PER       0.87      0.90      0.88      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.60      0.65      0.62      6937
weighted avg       0.67      0.72      0.69      6937



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.71it/s, F1=0.969, train_acc=1, train_loss=0.0232, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.689, eval_acc=0.96, eval_loss=9.7, eval_precision=0.659, eval_recall=0.737]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.76      0.72      3160
         LOC       0.31      0.38      0.34       482
         ORG       0.50      0.61      0.55      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.65      0.73      0.69      6937
   macro avg       0.59      0.67      0.62      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.81it/s, F1=0.966, train_acc=1, train_loss=0.0262, train_precision=0.965, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       0.97      0.98      0.98        64

   micro avg       0.99      1.00      0.99       229
   macro avg       0.99      1.00      0.99       229
weighted avg       0.99      1.00      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.691, eval_acc=0.961, eval_loss=9.66, eval_precision=0.655, eval_recall=0.745]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.77      0.73      3160
         LOC       0.31      0.39      0.35       482
         ORG       0.50      0.62      0.55      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.59      0.67      0.63      6937
weighted avg       0.66      0.74      0.70      6937



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.68it/s, F1=0.952, train_acc=0.999, train_loss=0.138, train_precision=0.95, train_recall=0.954] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       0.88      0.88      0.88        16
         ORG       1.00      1.00      1.00        57
         PER       0.97      0.98      0.98        64

   micro avg       0.98      0.99      0.98       229
   macro avg       0.96      0.96      0.96       229
weighted avg       0.98      0.99      0.98       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.69, eval_acc=0.96, eval_loss=9.89, eval_precision=0.662, eval_recall=0.734]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.78      0.73      3160
         LOC       0.29      0.37      0.33       482
         ORG       0.51      0.58      0.54      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.65      0.73      0.69      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.60it/s, F1=0.962, train_acc=0.999, train_loss=0.101, train_precision=0.965, train_recall=0.961]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       0.94      0.94      0.94        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       0.98      0.98      0.98       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.689, eval_acc=0.96, eval_loss=9.28, eval_precision=0.642, eval_recall=0.759] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.81      0.74      3160
         LOC       0.33      0.33      0.33       482
         ORG       0.46      0.64      0.54      1645
         PER       0.87      0.90      0.88      1650

   micro avg       0.64      0.76      0.69      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.65      0.76      0.70      6937



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.65it/s, F1=0.959, train_acc=0.999, train_loss=0.252, train_precision=0.957, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       1.00      0.94      0.97        16
         ORG       0.97      0.98      0.97        57
         PER       1.00      1.00      1.00        64

   micro avg       0.99      0.99      0.99       229
   macro avg       0.99      0.98      0.98       229
weighted avg       0.99      0.99      0.99       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.643, eval_acc=0.953, eval_loss=9.93, eval_precision=0.563, eval_recall=0.77] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.81      0.70      3160
         LOC       0.17      0.44      0.25       482
         ORG       0.45      0.63      0.52      1645
         PER       0.81      0.93      0.86      1650

   micro avg       0.56      0.77      0.65      6937
   macro avg       0.51      0.70      0.58      6937
weighted avg       0.59      0.77      0.67      6937



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.77it/s, F1=0.954, train_acc=0.999, train_loss=0.125, train_precision=0.95, train_recall=0.96]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98        92
         LOC       0.89      1.00      0.94        16
         ORG       1.00      1.00      1.00        57
         PER       0.98      1.00      0.99        64

   micro avg       0.98      0.99      0.98       229
   macro avg       0.96      0.99      0.98       229
weighted avg       0.98      0.99      0.98       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.681, eval_acc=0.96, eval_loss=9.89, eval_precision=0.643, eval_recall=0.738] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.80      0.70      3160
         LOC       0.26      0.26      0.26       482
         ORG       0.52      0.57      0.55      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.63      0.74      0.68      6937
   macro avg       0.57      0.64      0.60      6937
weighted avg       0.63      0.74      0.68      6937



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=0.906, train_acc=1, train_loss=0.0251, train_precision=0.906, train_recall=0.906]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.687, eval_acc=0.96, eval_loss=9.99, eval_precision=0.651, eval_recall=0.741] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72      3160
         LOC       0.27      0.41      0.33       482
         ORG       0.52      0.59      0.55      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.73it/s, F1=0.966, train_acc=1, train_loss=0.0218, train_precision=0.964, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.46it/s, F1=0.689, eval_acc=0.96, eval_loss=10.2, eval_precision=0.669, eval_recall=0.723] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.73      0.71      3160
         LOC       0.28      0.41      0.33       482
         ORG       0.53      0.60      0.56      1645
         PER       0.86      0.91      0.89      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.67      0.72      0.69      6937



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.69it/s, F1=1, train_acc=1, train_loss=0.0171, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.693, eval_acc=0.961, eval_loss=10.2, eval_precision=0.658, eval_recall=0.746]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72      3160
         LOC       0.35      0.34      0.35       482
         ORG       0.52      0.62      0.56      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.60      0.66      0.63      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.66it/s, F1=1, train_acc=1, train_loss=0.0151, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.691, eval_acc=0.96, eval_loss=10.4, eval_precision=0.651, eval_recall=0.749] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.79      0.71      3160
         LOC       0.35      0.28      0.31       482
         ORG       0.52      0.62      0.56      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.59      0.65      0.62      6937
weighted avg       0.64      0.74      0.69      6937



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.969, train_acc=1, train_loss=0.0102, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.696, eval_acc=0.961, eval_loss=10.5, eval_precision=0.666, eval_recall=0.741]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.78      0.72      3160
         LOC       0.36      0.32      0.34       482
         ORG       0.53      0.60      0.56      1645
         PER       0.86      0.91      0.89      1650

   micro avg       0.66      0.74      0.70      6937
   macro avg       0.60      0.65      0.63      6937
weighted avg       0.66      0.74      0.69      6937



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.76it/s, F1=0.969, train_acc=1, train_loss=0.00979, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00        92
         LOC       1.00      1.00      1.00        16
         ORG       1.00      1.00      1.00        57
         PER       1.00      1.00      1.00        64

   micro avg       1.00      1.00      1.00       229
   macro avg       1.00      1.00      1.00       229
weighted avg       1.00      1.00      1.00       229



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.694, eval_acc=0.96, eval_loss=10.6, eval_precision=0.669, eval_recall=0.735] 


eval_reports:
              precision    recall  f1-score   support

         GPE       0.68      0.77      0.72      3160
         LOC       0.32      0.38      0.35       482
         ORG       0.53      0.60      0.56      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.66      0.73      0.69      6937
   macro avg       0.60      0.66      0.63      6937
weighted avg       0.66      0.73      0.70      6937



calculate data/few_shot/note4/train_500.json etag: 100%|██████████| 192k/192k [00:00<00:00, 18.1MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 332MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 373MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 189kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_500.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_500_x1"
}
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 143847.97L/s]
build line mapper: 19L [00:00, 143073.21L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5120.26it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 198156.09it/s]

load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding



load dataset from data/few_shot/note4/train_500.json: 500it [00:00, 828.86it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 561.72it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model 

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.12it/s, F1=0.000209, train_acc=0.742, train_loss=32.5, train_precision=0.000108, train_recall=0.00317]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       171
         LOC       0.00      0.00      0.00        27
         ORG       0.00      0.00      0.00       110
         PER       0.00      0.01      0.00       121

   micro avg       0.00      0.00      0.00       429
   macro avg       0.00      0.00      0.00       429
weighted avg       0.00      0.00      0.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0, eval_acc=0.895, eval_loss=24.6, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.67it/s, F1=0.00819, train_acc=0.919, train_loss=10.5, train_precision=0.0212, train_recall=0.00854]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       171
         LOC       0.00      0.00      0.00        27
         ORG       0.29      0.05      0.08       110
         PER       0.00      0.00      0.00       121

   micro avg       0.05      0.01      0.02       429
   macro avg       0.07      0.01      0.02       429
weighted avg       0.08      0.01      0.02       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.0483, eval_acc=0.914, eval_loss=12.7, eval_precision=0.0459, eval_recall=0.0561]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.01      0.02      0.02      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.14      0.13      0.13      1645
         PER       0.03      0.05      0.04      1650

   micro avg       0.04      0.05      0.04      6937
   macro avg       0.05      0.05      0.05      6937
weighted avg       0.05      0.05      0.05      6937



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=0.344, train_acc=0.952, train_loss=5.15, train_precision=0.354, train_recall=0.368]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.26      0.36      0.30       171
         LOC       0.00      0.00      0.00        27
         ORG       0.27      0.35      0.31       110
         PER       0.56      0.61      0.58       121

   micro avg       0.33      0.41      0.37       429
   macro avg       0.27      0.33      0.30       429
weighted avg       0.33      0.41      0.36       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.478, eval_acc=0.943, eval_loss=7.42, eval_precision=0.513, eval_recall=0.461]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.55      0.43      0.48      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.12      0.15      0.13      1645
         PER       0.86      0.86      0.86      1650

   micro avg       0.49      0.43      0.46      6937
   macro avg       0.38      0.36      0.37      6937
weighted avg       0.48      0.43      0.45      6937



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.07it/s, F1=0.65, train_acc=0.979, train_loss=2.21, train_precision=0.634, train_recall=0.688] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.57      0.72      0.64       171
         LOC       0.00      0.00      0.00        27
         ORG       0.69      0.75      0.72       110
         PER       0.83      0.88      0.86       121

   micro avg       0.63      0.73      0.67       429
   macro avg       0.52      0.59      0.55       429
weighted avg       0.64      0.73      0.68       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.627, eval_acc=0.957, eval_loss=6, eval_precision=0.62, eval_recall=0.647]    


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.57      0.61      3160
         LOC       0.10      0.19      0.13       482
         ORG       0.53      0.59      0.56      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.60      0.63      0.61      6937
   macro avg       0.53      0.57      0.54      6937
weighted avg       0.63      0.63      0.63      6937



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.851, train_acc=0.99, train_loss=1.11, train_precision=0.863, train_recall=0.862]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.82      0.85      0.84       171
         LOC       0.35      0.33      0.34        27
         ORG       0.88      0.94      0.91       110
         PER       0.89      0.88      0.88       121

   micro avg       0.83      0.85      0.84       429
   macro avg       0.73      0.75      0.74       429
weighted avg       0.83      0.85      0.84       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.63, eval_acc=0.952, eval_loss=7.63, eval_precision=0.551, eval_recall=0.756] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.53      0.85      0.65      3160
         LOC       0.14      0.30      0.19       482
         ORG       0.50      0.52      0.51      1645
         PER       0.84      0.92      0.88      1650

   micro avg       0.54      0.75      0.63      6937
   macro avg       0.50      0.65      0.56      6937
weighted avg       0.57      0.75      0.64      6937



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.858, train_acc=0.991, train_loss=0.847, train_precision=0.843, train_recall=0.886]


train_reports:
              precision    recall  f1-score   support

         GPE       0.88      0.91      0.90       171
         LOC       0.60      0.78      0.68        27
         ORG       0.85      0.91      0.88       110
         PER       0.93      0.98      0.96       121

   micro avg       0.87      0.92      0.89       429
   macro avg       0.82      0.90      0.85       429
weighted avg       0.87      0.92      0.90       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.692, eval_acc=0.959, eval_loss=6.23, eval_precision=0.651, eval_recall=0.75] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.77      0.71      3160
         LOC       0.28      0.24      0.26       482
         ORG       0.51      0.64      0.57      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.57      0.64      0.60      6937
weighted avg       0.64      0.74      0.68      6937



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.65it/s, F1=0.938, train_acc=0.996, train_loss=0.424, train_precision=0.928, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.97      0.97       171
         LOC       0.68      0.78      0.72        27
         ORG       0.92      0.98      0.95       110
         PER       0.98      1.00      0.99       121

   micro avg       0.94      0.97      0.95       429
   macro avg       0.89      0.93      0.91       429
weighted avg       0.94      0.97      0.96       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.01it/s, F1=0.689, eval_acc=0.959, eval_loss=7.68, eval_precision=0.645, eval_recall=0.752]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.81      0.72      3160
         LOC       0.30      0.39      0.34       482
         ORG       0.54      0.60      0.57      1645
         PER       0.85      0.88      0.86      1650

   micro avg       0.64      0.75      0.69      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.64      0.75      0.69      6937



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.05it/s, F1=0.962, train_acc=0.998, train_loss=0.287, train_precision=0.959, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

         GPE       0.95      0.96      0.96       171
         LOC       1.00      1.00      1.00        27
         ORG       0.96      0.96      0.96       110
         PER       0.98      0.99      0.98       121

   micro avg       0.97      0.97      0.97       429
   macro avg       0.97      0.98      0.98       429
weighted avg       0.97      0.97      0.97       429



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  3.99it/s, F1=0.69, eval_acc=0.959, eval_loss=7.32, eval_precision=0.66, eval_recall=0.734]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.77      0.72      3160
         LOC       0.30      0.50      0.37       482
         ORG       0.54      0.57      0.55      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.65      0.73      0.69      6937
   macro avg       0.59      0.68      0.63      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.961, train_acc=0.999, train_loss=0.166, train_precision=0.955, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       171
         LOC       1.00      1.00      1.00        27
         ORG       0.93      0.96      0.95       110
         PER       0.98      0.99      0.99       121

   micro avg       0.96      0.98      0.97       429
   macro avg       0.97      0.99      0.98       429
weighted avg       0.96      0.98      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.713, eval_acc=0.962, eval_loss=7.96, eval_precision=0.703, eval_recall=0.734]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.72      0.72      3160
         LOC       0.36      0.42      0.39       482
         ORG       0.58      0.67      0.62      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.70      0.73      0.71      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.70      0.73      0.71      6937



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.961, train_acc=0.999, train_loss=0.182, train_precision=0.96, train_recall=0.963]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       171
         LOC       0.96      1.00      0.98        27
         ORG       0.99      0.99      0.99       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.98      0.99      0.99       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.713, eval_acc=0.961, eval_loss=7.6, eval_precision=0.68, eval_recall=0.764]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.80      0.73      3160
         LOC       0.32      0.37      0.35       482
         ORG       0.58      0.65      0.61      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.61      0.68      0.64      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.63it/s, F1=0.977, train_acc=0.999, train_loss=0.124, train_precision=0.974, train_recall=0.982] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.99      0.99      0.99       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      1.00      1.00       429
   macro avg       0.99      1.00      1.00       429
weighted avg       0.99      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.71, eval_acc=0.962, eval_loss=7.05, eval_precision=0.702, eval_recall=0.729] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.72      0.72      3160
         LOC       0.35      0.35      0.35       482
         ORG       0.57      0.64      0.60      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.69      0.72      0.71      6937
   macro avg       0.63      0.65      0.64      6937
weighted avg       0.69      0.72      0.71      6937



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.99it/s, F1=0.967, train_acc=0.998, train_loss=0.214, train_precision=0.959, train_recall=0.977] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.98      0.96       171
         LOC       0.96      1.00      0.98        27
         ORG       1.00      0.99      1.00       110
         PER       0.93      0.96      0.94       121

   micro avg       0.95      0.98      0.97       429
   macro avg       0.96      0.98      0.97       429
weighted avg       0.95      0.98      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.71, eval_acc=0.961, eval_loss=7.87, eval_precision=0.704, eval_recall=0.727] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.73      0.72      3160
         LOC       0.42      0.35      0.38       482
         ORG       0.58      0.62      0.60      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.69      0.72      0.71      6937
   macro avg       0.64      0.65      0.64      6937
weighted avg       0.69      0.72      0.70      6937



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.65it/s, F1=0.995, train_acc=0.999, train_loss=0.0993, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       0.98      0.99      0.98       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.99      1.00      0.99       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.69, eval_acc=0.96, eval_loss=9.11, eval_precision=0.671, eval_recall=0.722]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.76      0.71      3160
         LOC       0.28      0.41      0.33       482
         ORG       0.58      0.57      0.57      1645
         PER       0.84      0.89      0.87      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.66      0.72      0.69      6937



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.936, train_acc=0.997, train_loss=0.39, train_precision=0.932, train_recall=0.945] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       171
         LOC       0.93      0.96      0.95        27
         ORG       0.92      0.95      0.94       110
         PER       0.99      0.99      0.99       121

   micro avg       0.96      0.98      0.97       429
   macro avg       0.95      0.97      0.96       429
weighted avg       0.96      0.98      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.04it/s, F1=0.675, eval_acc=0.956, eval_loss=9.01, eval_precision=0.618, eval_recall=0.758]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.77      0.72      3160
         LOC       0.21      0.57      0.31       482
         ORG       0.56      0.61      0.58      1645
         PER       0.82      0.91      0.86      1650

   micro avg       0.61      0.75      0.67      6937
   macro avg       0.56      0.72      0.62      6937
weighted avg       0.65      0.75      0.69      6937



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.954, train_acc=0.998, train_loss=0.341, train_precision=0.946, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       171
         LOC       0.73      0.81      0.77        27
         ORG       0.95      0.96      0.96       110
         PER       0.98      1.00      0.99       121

   micro avg       0.95      0.97      0.96       429
   macro avg       0.91      0.94      0.92       429
weighted avg       0.95      0.97      0.96       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.66, eval_acc=0.957, eval_loss=10.4, eval_precision=0.715, eval_recall=0.623] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.68      0.68      3160
         LOC       0.40      0.15      0.22       482
         ORG       0.61      0.49      0.55      1645
         PER       0.88      0.79      0.83      1650

   micro avg       0.71      0.62      0.66      6937
   macro avg       0.64      0.53      0.57      6937
weighted avg       0.69      0.62      0.65      6937



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.08it/s, F1=0.955, train_acc=0.999, train_loss=0.101, train_precision=0.955, train_recall=0.957] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       171
         LOC       1.00      0.96      0.98        27
         ORG       0.97      0.98      0.98       110
         PER       0.98      0.99      0.99       121

   micro avg       0.98      0.99      0.98       429
   macro avg       0.98      0.98      0.98       429
weighted avg       0.98      0.99      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.687, eval_acc=0.958, eval_loss=10.3, eval_precision=0.71, eval_recall=0.676] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.67      0.70      3160
         LOC       0.25      0.40      0.31       482
         ORG       0.66      0.56      0.60      1645
         PER       0.89      0.86      0.88      1650

   micro avg       0.70      0.67      0.68      6937
   macro avg       0.63      0.62      0.62      6937
weighted avg       0.72      0.67      0.69      6937



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.949, train_acc=0.998, train_loss=0.215, train_precision=0.937, train_recall=0.967] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.92      0.98      0.95       171
         LOC       0.74      0.96      0.84        27
         ORG       1.00      0.99      1.00       110
         PER       0.95      0.98      0.97       121

   micro avg       0.94      0.98      0.96       429
   macro avg       0.90      0.98      0.94       429
weighted avg       0.94      0.98      0.96       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.695, eval_acc=0.958, eval_loss=8.86, eval_precision=0.661, eval_recall=0.746]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.75      0.70      3160
         LOC       0.54      0.17      0.26       482
         ORG       0.49      0.72      0.58      1645
         PER       0.89      0.90      0.90      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.65      0.64      0.61      6937
weighted avg       0.67      0.74      0.69      6937



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.65it/s, F1=0.966, train_acc=0.996, train_loss=0.593, train_precision=0.964, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       0.78      0.78      0.78        27
         ORG       0.93      0.96      0.95       110
         PER       1.00      0.99      1.00       121

   micro avg       0.96      0.97      0.97       429
   macro avg       0.92      0.93      0.93       429
weighted avg       0.96      0.97      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.672, eval_acc=0.954, eval_loss=11.3, eval_precision=0.697, eval_recall=0.659]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72      3160
         LOC       0.46      0.24      0.31       482
         ORG       0.52      0.34      0.41      1645
         PER       0.87      0.86      0.87      1650

   micro avg       0.69      0.66      0.67      6937
   macro avg       0.63      0.56      0.58      6937
weighted avg       0.67      0.66      0.65      6937



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.943, train_acc=0.999, train_loss=0.143, train_precision=0.948, train_recall=0.94] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       0.93      0.93      0.93        27
         ORG       0.98      0.97      0.98       110
         PER       0.99      1.00      1.00       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.97      0.97      0.97       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.45it/s, F1=0.702, eval_acc=0.959, eval_loss=10.1, eval_precision=0.687, eval_recall=0.728]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.80      0.74      3160
         LOC       0.47      0.35      0.40       482
         ORG       0.53      0.59      0.56      1645
         PER       0.87      0.84      0.86      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.64      0.64      0.64      6937
weighted avg       0.68      0.73      0.70      6937



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.976, train_acc=1, train_loss=0.0571, train_precision=0.981, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       0.93      0.93      0.93        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       0.98      0.98      0.98       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.703, eval_acc=0.959, eval_loss=9.82, eval_precision=0.664, eval_recall=0.76] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.81      0.74      3160
         LOC       0.29      0.50      0.36       482
         ORG       0.57      0.62      0.60      1645
         PER       0.89      0.88      0.88      1650

   micro avg       0.65      0.76      0.70      6937
   macro avg       0.61      0.70      0.64      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.998, train_acc=1, train_loss=0.0158, train_precision=0.997, train_recall=1]   


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       0.96      1.00      0.98        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       0.99      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.713, eval_acc=0.96, eval_loss=10.2, eval_precision=0.688, eval_recall=0.753] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.81      0.74      3160
         LOC       0.36      0.46      0.40       482
         ORG       0.58      0.61      0.59      1645
         PER       0.89      0.87      0.88      1650

   micro avg       0.68      0.75      0.71      6937
   macro avg       0.63      0.69      0.66      6937
weighted avg       0.69      0.75      0.72      6937



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.952, train_acc=1, train_loss=0.0159, train_precision=0.952, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.709, eval_acc=0.959, eval_loss=10.4, eval_precision=0.664, eval_recall=0.774]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.84      0.73      3160
         LOC       0.34      0.42      0.37       482
         ORG       0.56      0.63      0.59      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.66      0.77      0.71      6937
   macro avg       0.61      0.69      0.65      6937
weighted avg       0.66      0.77      0.71      6937



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.03it/s, F1=0.952, train_acc=1, train_loss=0.0111, train_precision=0.952, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.724, eval_acc=0.961, eval_loss=10.8, eval_precision=0.714, eval_recall=0.745]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.79      0.75      3160
         LOC       0.46      0.37      0.41       482
         ORG       0.58      0.61      0.59      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.66      0.67      0.66      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.74it/s, F1=0.966, train_acc=1, train_loss=0.00957, train_precision=0.966, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       0.96      0.96      0.96        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       0.99      0.99      0.99       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.715, eval_acc=0.961, eval_loss=10.4, eval_precision=0.681, eval_recall=0.765]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.80      0.74      3160
         LOC       0.34      0.46      0.39       482
         ORG       0.57      0.64      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.67      0.76      0.72      6937
   macro avg       0.62      0.70      0.66      6937
weighted avg       0.68      0.76      0.72      6937



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=1, train_acc=1, train_loss=0.00795, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.03it/s, F1=0.713, eval_acc=0.961, eval_loss=10.5, eval_precision=0.682, eval_recall=0.758]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.79      0.74      3160
         LOC       0.33      0.45      0.38       482
         ORG       0.58      0.65      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.68      0.76      0.72      6937
   macro avg       0.62      0.69      0.66      6937
weighted avg       0.69      0.76      0.72      6937



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.984, train_acc=1, train_loss=0.00547, train_precision=0.984, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.52it/s, F1=0.709, eval_acc=0.96, eval_loss=10.9, eval_precision=0.671, eval_recall=0.763] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.81      0.73      3160
         LOC       0.33      0.45      0.38       482
         ORG       0.58      0.63      0.60      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.62      0.70      0.65      6937
weighted avg       0.68      0.76      0.72      6937



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.968, train_acc=1, train_loss=0.00473, train_precision=0.968, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.716, eval_acc=0.961, eval_loss=11, eval_precision=0.688, eval_recall=0.758]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.80      0.74      3160
         LOC       0.36      0.43      0.39       482
         ORG       0.59      0.64      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.68      0.76      0.72      6937
   macro avg       0.63      0.69      0.66      6937
weighted avg       0.69      0.76      0.72      6937



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.968, train_acc=1, train_loss=0.00533, train_precision=0.968, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.723, eval_acc=0.961, eval_loss=11.6, eval_precision=0.72, eval_recall=0.737] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.76      0.74      3160
         LOC       0.42      0.40      0.41       482
         ORG       0.60      0.62      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.71      0.73      0.72      6937
   macro avg       0.66      0.67      0.66      6937
weighted avg       0.71      0.73      0.72      6937



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.72it/s, F1=0.984, train_acc=1, train_loss=0.00397, train_precision=0.984, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.722, eval_acc=0.962, eval_loss=11.5, eval_precision=0.712, eval_recall=0.744]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.77      0.74      3160
         LOC       0.41      0.41      0.41       482
         ORG       0.59      0.63      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.71      0.74      0.72      6937
   macro avg       0.65      0.68      0.66      6937
weighted avg       0.71      0.74      0.72      6937



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.04it/s, F1=0.984, train_acc=1, train_loss=0.00273, train_precision=0.984, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.722, eval_acc=0.961, eval_loss=11.6, eval_precision=0.709, eval_recall=0.746]


eval_reports:
              precision    recall  f1-score   support

         GPE       0.71      0.78      0.74      3160
         LOC       0.39      0.41      0.40       482
         ORG       0.60      0.63      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.65      0.68      0.66      6937
weighted avg       0.70      0.74      0.72      6937



calculate data/few_shot/note4/train_500.json etag: 100%|██████████| 192k/192k [00:00<00:00, 203MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 330MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 374MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 207kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_500.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_500_x2"
}
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 187069.90L/s]
build line mapper: 19L [00:00, 159702.96L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5505.10it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 213269.69it/s]
load dataset from data/few_shot/note4/train_500.json: 0it [00:00, ?it/s]

load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_500.json: 500it [00:00, 844.55it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:10, 426.60it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model f

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.63it/s, F1=0.000449, train_acc=0.558, train_loss=64.1, train_precision=0.000239, train_recall=0.00403] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       171
         LOC       0.00      0.00      0.00        27
         ORG       0.00      0.00      0.00       110
         PER       0.00      0.02      0.00       121
           _       0.00      0.00      0.00         0

   micro avg       0.00      0.01      0.00       429
   macro avg       0.00      0.00      0.00       429
weighted avg       0.00      0.01      0.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0, eval_acc=0.895, eval_loss=33.6, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.67it/s, F1=0, train_acc=0.919, train_loss=14.4, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       171
         LOC       0.00      0.00      0.00        27
         ORG       0.00      0.00      0.00       110
         PER       0.00      0.00      0.00       121

   micro avg       0.00      0.00      0.00       429
   macro avg       0.00      0.00      0.00       429
weighted avg       0.00      0.00      0.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.0149, eval_acc=0.901, eval_loss=20.1, eval_precision=0.0113, eval_recall=0.0222] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.03      0.05      0.03      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.01      0.02      0.01      1645
         PER       0.00      0.01      0.00      1650

   micro avg       0.01      0.03      0.02      6937
   macro avg       0.01      0.02      0.01      6937
weighted avg       0.01      0.03      0.02      6937



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.0956, train_acc=0.935, train_loss=7.9, train_precision=0.0884, train_recall=0.11]      


train_reports:
              precision    recall  f1-score   support

         GPE       0.11      0.20      0.14       171
         LOC       0.00      0.00      0.00        27
         ORG       0.09      0.13      0.11       110
         PER       0.03      0.04      0.04       121

   micro avg       0.08      0.12      0.10       429
   macro avg       0.06      0.09      0.07       429
weighted avg       0.08      0.12      0.09       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.546, eval_acc=0.936, eval_loss=12.1, eval_precision=0.449, eval_recall=0.709]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.44      0.86      0.58      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.31      0.48      0.37      1645
         PER       0.61      0.83      0.70      1650

   micro avg       0.44      0.70      0.54      6937
   macro avg       0.34      0.54      0.41      6937
weighted avg       0.42      0.70      0.52      6937



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.65it/s, F1=0.626, train_acc=0.97, train_loss=3.87, train_precision=0.589, train_recall=0.691] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.52      0.76      0.62       171
         LOC       0.00      0.00      0.00        27
         ORG       0.57      0.70      0.63       110
         PER       0.68      0.80      0.74       121

   micro avg       0.58      0.71      0.64       429
   macro avg       0.45      0.57      0.50       429
weighted avg       0.55      0.71      0.62       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.542, eval_acc=0.955, eval_loss=8.26, eval_precision=0.52, eval_recall=0.578] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.43      0.53      0.47      3160
         LOC       0.02      0.01      0.01       482
         ORG       0.48      0.50      0.49      1645
         PER       0.73      0.86      0.79      1650

   micro avg       0.50      0.56      0.53      6937
   macro avg       0.41      0.47      0.44      6937
weighted avg       0.48      0.56      0.52      6937



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.10it/s, F1=0.75, train_acc=0.985, train_loss=2.02, train_precision=0.732, train_recall=0.786] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.75      0.84      0.79       171
         LOC       0.24      0.26      0.25        27
         ORG       0.77      0.85      0.81       110
         PER       0.80      0.87      0.83       121

   micro avg       0.74      0.81      0.77       429
   macro avg       0.64      0.70      0.67       429
weighted avg       0.74      0.81      0.77       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.649, eval_acc=0.958, eval_loss=8.2, eval_precision=0.608, eval_recall=0.71]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.61      0.77      0.68      3160
         LOC       0.07      0.06      0.07       482
         ORG       0.51      0.57      0.54      1645
         PER       0.79      0.90      0.84      1650

   micro avg       0.60      0.70      0.65      6937
   macro avg       0.49      0.57      0.53      6937
weighted avg       0.59      0.70      0.64      6937



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=0.778, train_acc=0.99, train_loss=1.12, train_precision=0.751, train_recall=0.821]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.80      0.88      0.84       171
         LOC       0.12      0.19      0.14        27
         ORG       0.80      0.89      0.84       110
         PER       0.94      0.97      0.96       121

   micro avg       0.78      0.86      0.82       429
   macro avg       0.67      0.73      0.70       429
weighted avg       0.80      0.86      0.83       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.643, eval_acc=0.958, eval_loss=8.54, eval_precision=0.592, eval_recall=0.717]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.76      0.70      3160
         LOC       0.08      0.20      0.12       482
         ORG       0.54      0.58      0.56      1645
         PER       0.81      0.89      0.85      1650

   micro avg       0.58      0.71      0.64      6937
   macro avg       0.52      0.61      0.56      6937
weighted avg       0.62      0.71      0.66      6937



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.63it/s, F1=0.866, train_acc=0.993, train_loss=0.837, train_precision=0.852, train_recall=0.889]


train_reports:
              precision    recall  f1-score   support

         GPE       0.89      0.92      0.91       171
         LOC       0.26      0.37      0.30        27
         ORG       0.91      0.96      0.93       110
         PER       0.95      0.95      0.95       121

   micro avg       0.86      0.91      0.88       429
   macro avg       0.75      0.80      0.77       429
weighted avg       0.87      0.91      0.89       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.18it/s, F1=0.633, eval_acc=0.957, eval_loss=8.39, eval_precision=0.59, eval_recall=0.697] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.60      0.74      0.66      3160
         LOC       0.06      0.08      0.07       482
         ORG       0.50      0.56      0.53      1645
         PER       0.78      0.89      0.84      1650

   micro avg       0.58      0.69      0.63      6937
   macro avg       0.49      0.57      0.52      6937
weighted avg       0.58      0.69      0.63      6937



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.72it/s, F1=0.87, train_acc=0.995, train_loss=0.576, train_precision=0.857, train_recall=0.892] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.91      0.94      0.92       171
         LOC       0.58      0.67      0.62        27
         ORG       0.88      0.95      0.91       110
         PER       0.91      0.97      0.94       121

   micro avg       0.88      0.93      0.90       429
   macro avg       0.82      0.88      0.85       429
weighted avg       0.88      0.93      0.91       429



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.44it/s, F1=0.655, eval_acc=0.962, eval_loss=8.47, eval_precision=0.625, eval_recall=0.698]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.69      0.70      3160
         LOC       0.13      0.28      0.18       482
         ORG       0.55      0.63      0.58      1645
         PER       0.82      0.88      0.85      1650

   micro avg       0.61      0.69      0.65      6937
   macro avg       0.55      0.62      0.58      6937
weighted avg       0.65      0.69      0.67      6937



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.947, train_acc=0.998, train_loss=0.269, train_precision=0.94, train_recall=0.956] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.97      0.96       171
         LOC       0.67      0.74      0.70        27
         ORG       0.97      0.98      0.98       110
         PER       0.97      0.98      0.97       121

   micro avg       0.94      0.96      0.95       429
   macro avg       0.89      0.92      0.90       429
weighted avg       0.94      0.96      0.95       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.657, eval_acc=0.96, eval_loss=9.18, eval_precision=0.619, eval_recall=0.71]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.69      0.70      3160
         LOC       0.15      0.37      0.21       482
         ORG       0.57      0.65      0.61      1645
         PER       0.81      0.89      0.85      1650

   micro avg       0.61      0.71      0.66      6937
   macro avg       0.56      0.65      0.59      6937
weighted avg       0.66      0.71      0.68      6937



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.72it/s, F1=0.959, train_acc=0.999, train_loss=0.144, train_precision=0.954, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       171
         LOC       0.77      0.85      0.81        27
         ORG       1.00      1.00      1.00       110
         PER       0.98      0.99      0.99       121

   micro avg       0.96      0.98      0.97       429
   macro avg       0.93      0.96      0.94       429
weighted avg       0.96      0.98      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.662, eval_acc=0.961, eval_loss=9.76, eval_precision=0.622, eval_recall=0.719]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.75      0.71      3160
         LOC       0.16      0.37      0.22       482
         ORG       0.58      0.60      0.59      1645
         PER       0.80      0.89      0.84      1650

   micro avg       0.61      0.72      0.66      6937
   macro avg       0.56      0.65      0.59      6937
weighted avg       0.65      0.72      0.68      6937



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.64it/s, F1=0.921, train_acc=0.997, train_loss=0.517, train_precision=0.903, train_recall=0.95] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.88      0.91      0.90       171
         LOC       0.68      0.85      0.75        27
         ORG       0.96      1.00      0.98       110
         PER       0.94      0.99      0.97       121

   micro avg       0.90      0.95      0.93       429
   macro avg       0.87      0.94      0.90       429
weighted avg       0.91      0.95      0.93       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.636, eval_acc=0.956, eval_loss=9.51, eval_precision=0.58, eval_recall=0.716] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.66      0.65      3160
         LOC       0.17      0.34      0.23       482
         ORG       0.54      0.67      0.60      1645
         PER       0.69      0.92      0.79      1650

   micro avg       0.57      0.70      0.63      6937
   macro avg       0.51      0.65      0.57      6937
weighted avg       0.59      0.70      0.64      6937



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.11it/s, F1=0.938, train_acc=0.998, train_loss=0.312, train_precision=0.929, train_recall=0.949]


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.97      0.95       171
         LOC       0.77      0.89      0.83        27
         ORG       0.98      1.00      0.99       110
         PER       0.97      0.98      0.97       121

   micro avg       0.95      0.97      0.96       429
   macro avg       0.92      0.96      0.94       429
weighted avg       0.95      0.97      0.96       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.611, eval_acc=0.956, eval_loss=11, eval_precision=0.595, eval_recall=0.638]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.65      0.64      3160
         LOC       0.17      0.41      0.24       482
         ORG       0.59      0.51      0.55      1645
         PER       0.83      0.80      0.82      1650

   micro avg       0.59      0.64      0.61      6937
   macro avg       0.55      0.59      0.56      6937
weighted avg       0.63      0.64      0.63      6937



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.67it/s, F1=0.96, train_acc=0.999, train_loss=0.222, train_precision=0.954, train_recall=0.969] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       171
         LOC       0.93      0.93      0.93        27
         ORG       0.98      0.98      0.98       110
         PER       0.98      0.99      0.98       121

   micro avg       0.97      0.98      0.97       429
   macro avg       0.96      0.97      0.97       429
weighted avg       0.97      0.98      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.671, eval_acc=0.959, eval_loss=10.3, eval_precision=0.614, eval_recall=0.754]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.79      0.70      3160
         LOC       0.21      0.39      0.28       482
         ORG       0.55      0.64      0.59      1645
         PER       0.83      0.87      0.85      1650

   micro avg       0.61      0.75      0.67      6937
   macro avg       0.55      0.67      0.60      6937
weighted avg       0.63      0.75      0.68      6937



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.60it/s, F1=0.956, train_acc=1, train_loss=0.0649, train_precision=0.954, train_recall=0.959]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       0.99      0.99      0.99       121

   micro avg       0.99      1.00      0.99       429
   macro avg       0.99      1.00      0.99       429
weighted avg       0.99      1.00      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.69, eval_acc=0.96, eval_loss=10.9, eval_precision=0.663, eval_recall=0.732]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.75      0.71      3160
         LOC       0.24      0.34      0.28       482
         ORG       0.58      0.64      0.61      1645
         PER       0.83      0.88      0.86      1650

   micro avg       0.65      0.73      0.69      6937
   macro avg       0.59      0.65      0.62      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.73it/s, F1=0.954, train_acc=0.999, train_loss=0.117, train_precision=0.95, train_recall=0.96]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.96      0.98      0.97       110
         PER       0.98      0.99      0.98       121

   micro avg       0.97      0.99      0.98       429
   macro avg       0.98      0.99      0.99       429
weighted avg       0.97      0.99      0.98       429



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.45it/s, F1=0.657, eval_acc=0.954, eval_loss=11.4, eval_precision=0.598, eval_recall=0.742]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.72      0.70      3160
         LOC       0.22      0.37      0.28       482
         ORG       0.46      0.69      0.55      1645
         PER       0.77      0.90      0.83      1650

   micro avg       0.59      0.73      0.66      6937
   macro avg       0.53      0.67      0.59      6937
weighted avg       0.62      0.73      0.67      6937



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.982, train_acc=1, train_loss=0.101, train_precision=0.982, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.98      1.00      0.99       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      1.00      0.99       429
   macro avg       0.99      1.00      1.00       429
weighted avg       0.99      1.00      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.689, eval_acc=0.96, eval_loss=11.5, eval_precision=0.653, eval_recall=0.742] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.77      0.72      3160
         LOC       0.26      0.37      0.31       482
         ORG       0.57      0.62      0.59      1645
         PER       0.81      0.89      0.85      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.58      0.66      0.62      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=0.967, train_acc=0.999, train_loss=0.132, train_precision=0.964, train_recall=0.971]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.99      0.97       171
         LOC       0.96      1.00      0.98        27
         ORG       0.97      0.96      0.97       110
         PER       0.98      0.98      0.98       121

   micro avg       0.97      0.98      0.98       429
   macro avg       0.97      0.98      0.98       429
weighted avg       0.97      0.98      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.665, eval_acc=0.959, eval_loss=12.1, eval_precision=0.653, eval_recall=0.689]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.69      0.67      3160
         LOC       0.26      0.21      0.24       482
         ORG       0.52      0.61      0.56      1645
         PER       0.82      0.90      0.85      1650

   micro avg       0.64      0.68      0.66      6937
   macro avg       0.57      0.60      0.58      6937
weighted avg       0.64      0.68      0.66      6937



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.64it/s, F1=0.98, train_acc=1, train_loss=0.126, train_precision=0.98, train_recall=0.981]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      0.96      0.98        27
         ORG       0.99      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      0.99      0.99       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.667, eval_acc=0.959, eval_loss=11.4, eval_precision=0.635, eval_recall=0.714]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.76      0.70      3160
         LOC       0.20      0.34      0.25       482
         ORG       0.59      0.55      0.57      1645
         PER       0.81      0.90      0.85      1650

   micro avg       0.63      0.71      0.67      6937
   macro avg       0.56      0.64      0.59      6937
weighted avg       0.64      0.71      0.67      6937



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.04it/s, F1=0.977, train_acc=1, train_loss=0.0756, train_precision=0.976, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      1.00      0.99       429
   macro avg       1.00      1.00      1.00       429
weighted avg       0.99      1.00      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.674, eval_acc=0.96, eval_loss=11.6, eval_precision=0.663, eval_recall=0.696] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.73      0.69      3160
         LOC       0.26      0.28      0.27       482
         ORG       0.59      0.54      0.56      1645
         PER       0.82      0.90      0.86      1650

   micro avg       0.66      0.69      0.67      6937
   macro avg       0.58      0.61      0.60      6937
weighted avg       0.65      0.69      0.67      6937



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.983, train_acc=1, train_loss=0.0511, train_precision=0.983, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.99      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       0.99      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.684, eval_acc=0.96, eval_loss=12, eval_precision=0.657, eval_recall=0.723]   


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.80      0.72      3160
         LOC       0.29      0.28      0.28       482
         ORG       0.58      0.52      0.55      1645
         PER       0.82      0.90      0.86      1650

   micro avg       0.65      0.72      0.69      6937
   macro avg       0.58      0.63      0.60      6937
weighted avg       0.65      0.72      0.68      6937



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.67it/s, F1=0.966, train_acc=0.999, train_loss=0.106, train_precision=0.964, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.98      0.98      0.98       110
         PER       0.99      1.00      1.00       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.99      0.99      0.99       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.676, eval_acc=0.961, eval_loss=11.3, eval_precision=0.671, eval_recall=0.692]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.70      0.69      3160
         LOC       0.29      0.32      0.31       482
         ORG       0.57      0.64      0.60      1645
         PER       0.86      0.84      0.85      1650

   micro avg       0.66      0.69      0.68      6937
   macro avg       0.60      0.62      0.61      6937
weighted avg       0.67      0.69      0.68      6937



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.73it/s, F1=0.991, train_acc=0.999, train_loss=0.0832, train_precision=0.989, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.99      1.00      1.00       110
         PER       0.99      0.99      0.99       121

   micro avg       0.99      1.00      0.99       429
   macro avg       0.99      1.00      1.00       429
weighted avg       0.99      1.00      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.687, eval_acc=0.96, eval_loss=11.6, eval_precision=0.651, eval_recall=0.739] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.77      0.72      3160
         LOC       0.25      0.37      0.30       482
         ORG       0.58      0.62      0.60      1645
         PER       0.80      0.89      0.84      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.58      0.66      0.61      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.05it/s, F1=0.952, train_acc=1, train_loss=0.0156, train_precision=0.952, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.693, eval_acc=0.961, eval_loss=12.1, eval_precision=0.661, eval_recall=0.741]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.79      0.72      3160
         LOC       0.26      0.34      0.30       482
         ORG       0.59      0.60      0.59      1645
         PER       0.82      0.89      0.85      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.58      0.66      0.62      6937
weighted avg       0.66      0.74      0.69      6937



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.999, train_acc=1, train_loss=0.0107, train_precision=1, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      0.99      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.694, eval_acc=0.961, eval_loss=12.4, eval_precision=0.665, eval_recall=0.739]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72      3160
         LOC       0.29      0.37      0.32       482
         ORG       0.59      0.60      0.59      1645
         PER       0.81      0.89      0.85      1650

   micro avg       0.66      0.74      0.69      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.66      0.74      0.69      6937



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.967, train_acc=1, train_loss=0.0349, train_precision=0.968, train_recall=0.966] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      0.99      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.689, eval_acc=0.96, eval_loss=12.4, eval_precision=0.65, eval_recall=0.745]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.79      0.72      3160
         LOC       0.26      0.37      0.31       482
         ORG       0.57      0.61      0.59      1645
         PER       0.81      0.90      0.85      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=0.961, train_acc=1, train_loss=0.0703, train_precision=0.958, train_recall=0.964]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       0.98      1.00      0.99       121

   micro avg       0.99      1.00      0.99       429
   macro avg       0.99      1.00      1.00       429
weighted avg       0.99      1.00      0.99       429



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.42it/s, F1=0.687, eval_acc=0.961, eval_loss=12.6, eval_precision=0.665, eval_recall=0.721]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.77      0.73      3160
         LOC       0.28      0.37      0.32       482
         ORG       0.59      0.58      0.59      1645
         PER       0.82      0.87      0.84      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.59      0.65      0.62      6937
weighted avg       0.67      0.72      0.69      6937



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.73it/s, F1=0.984, train_acc=1, train_loss=0.00973, train_precision=0.984, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.697, eval_acc=0.962, eval_loss=12.2, eval_precision=0.658, eval_recall=0.753]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.79      0.73      3160
         LOC       0.28      0.34      0.31       482
         ORG       0.57      0.64      0.60      1645
         PER       0.81      0.91      0.85      1650

   micro avg       0.65      0.75      0.70      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.66      0.75      0.70      6937



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.984, train_acc=1, train_loss=0.008, train_precision=0.984, train_recall=0.984]  


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.693, eval_acc=0.961, eval_loss=12.3, eval_precision=0.647, eval_recall=0.759]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72      3160
         LOC       0.27      0.37      0.31       482
         ORG       0.55      0.67      0.60      1645
         PER       0.80      0.90      0.85      1650

   micro avg       0.64      0.76      0.69      6937
   macro avg       0.57      0.68      0.62      6937
weighted avg       0.65      0.76      0.70      6937



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.984, train_acc=1, train_loss=0.007, train_precision=0.984, train_recall=0.984]  


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.694, eval_acc=0.961, eval_loss=12.4, eval_precision=0.654, eval_recall=0.752]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.77      0.72      3160
         LOC       0.27      0.37      0.31       482
         ORG       0.56      0.66      0.61      1645
         PER       0.80      0.90      0.85      1650

   micro avg       0.65      0.75      0.69      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.65      0.75      0.70      6937



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.70it/s, F1=0.937, train_acc=1, train_loss=0.00439, train_precision=0.937, train_recall=0.937]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.697, eval_acc=0.961, eval_loss=12.5, eval_precision=0.658, eval_recall=0.753]


eval_reports:
              precision    recall  f1-score   support

         GPE       0.68      0.78      0.73      3160
         LOC       0.28      0.36      0.31       482
         ORG       0.57      0.65      0.61      1645
         PER       0.80      0.90      0.85      1650

   micro avg       0.65      0.75      0.70      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.65      0.75      0.70      6937



calculate data/few_shot/note4/train_500.json etag: 100%|██████████| 192k/192k [00:00<00:00, 244MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 331MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 375MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 565kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_500.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_500_x3"
}
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 159702.96L/s]
build line mapper: 19L [00:00, 104995.75L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5539.15it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 208556.55it/s]
load dataset from data/few_shot/note4/train_500.json: 0it [00:00, ?it/s]

load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/36a18c95fb213f26988dba66c921f34a_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_500.json: 500it [00:00, 841.24it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 571.29it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model f

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=0, train_acc=0.684, train_loss=30.4, train_precision=0, train_recall=0]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       171
         LOC       0.00      0.00      0.00        27
         ORG       0.00      0.00      0.00       110
         PER       0.00      0.00      0.00       121

   micro avg       0.00      0.00      0.00       429
   macro avg       0.00      0.00      0.00       429
weighted avg       0.00      0.00      0.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.01it/s, F1=0, eval_acc=0.895, eval_loss=24.4, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.00942, train_acc=0.92, train_loss=10.1, train_precision=0.00816, train_recall=0.0112]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       171
         LOC       0.00      0.00      0.00        27
         ORG       0.00      0.00      0.00       110
         PER       0.67      0.05      0.09       121

   micro avg       0.05      0.01      0.02       429
   macro avg       0.17      0.01      0.02       429
weighted avg       0.19      0.01      0.03       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.148, eval_acc=0.916, eval_loss=14.2, eval_precision=0.112, eval_recall=0.226]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.02      0.03      0.02      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.05      0.23      0.08      1645
         PER       0.60      0.60      0.60      1650

   micro avg       0.10      0.21      0.13      6937
   macro avg       0.17      0.22      0.18      6937
weighted avg       0.16      0.21      0.17      6937



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.382, train_acc=0.958, train_loss=4.6, train_precision=0.39, train_recall=0.414]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.30      0.50      0.38       171
         LOC       0.00      0.00      0.00        27
         ORG       0.13      0.25      0.17       110
         PER       0.70      0.63      0.66       121

   micro avg       0.32      0.44      0.37       429
   macro avg       0.28      0.34      0.30       429
weighted avg       0.35      0.44      0.38       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.546, eval_acc=0.953, eval_loss=6.89, eval_precision=0.516, eval_recall=0.593]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.58      0.60      0.59      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.24      0.44      0.31      1645
         PER       0.82      0.86      0.84      1650

   micro avg       0.50      0.58      0.54      6937
   macro avg       0.41      0.47      0.43      6937
weighted avg       0.52      0.58      0.54      6937



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.65it/s, F1=0.686, train_acc=0.98, train_loss=2.17, train_precision=0.684, train_recall=0.698] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.72      0.81      0.76       171
         LOC       0.18      0.07      0.11        27
         ORG       0.67      0.81      0.73       110
         PER       0.79      0.81      0.80       121

   micro avg       0.71      0.76      0.74       429
   macro avg       0.59      0.63      0.60       429
weighted avg       0.69      0.76      0.72       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.657, eval_acc=0.958, eval_loss=6.75, eval_precision=0.649, eval_recall=0.676]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.76      0.69      3160
         LOC       0.23      0.06      0.10       482
         ORG       0.48      0.47      0.48      1645
         PER       0.85      0.88      0.87      1650

   micro avg       0.64      0.67      0.66      6937
   macro avg       0.55      0.54      0.53      6937
weighted avg       0.62      0.67      0.64      6937



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.72it/s, F1=0.762, train_acc=0.988, train_loss=1.25, train_precision=0.782, train_recall=0.762] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.81      0.86      0.83       171
         LOC       0.60      0.44      0.51        27
         ORG       0.85      0.90      0.88       110
         PER       0.90      0.83      0.87       121

   micro avg       0.83      0.84      0.84       429
   macro avg       0.79      0.76      0.77       429
weighted avg       0.83      0.84      0.83       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.644, eval_acc=0.952, eval_loss=7.56, eval_precision=0.571, eval_recall=0.755]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.62      0.74      0.68      3160
         LOC       0.26      0.24      0.25       482
         ORG       0.38      0.71      0.50      1645
         PER       0.82      0.91      0.86      1650

   micro avg       0.56      0.74      0.64      6937
   macro avg       0.52      0.65      0.57      6937
weighted avg       0.59      0.74      0.65      6937



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.871, train_acc=0.991, train_loss=1.03, train_precision=0.863, train_recall=0.893] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.87      0.92      0.89       171
         LOC       0.62      0.67      0.64        27
         ORG       0.86      0.92      0.89       110
         PER       0.94      0.97      0.96       121

   micro avg       0.87      0.92      0.89       429
   macro avg       0.82      0.87      0.84       429
weighted avg       0.87      0.92      0.89       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.652, eval_acc=0.954, eval_loss=6.81, eval_precision=0.6, eval_recall=0.729]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.68      0.67      3160
         LOC       0.27      0.37      0.31       482
         ORG       0.39      0.69      0.50      1645
         PER       0.89      0.90      0.89      1650

   micro avg       0.58      0.71      0.64      6937
   macro avg       0.55      0.66      0.59      6937
weighted avg       0.63      0.71      0.66      6937



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.904, train_acc=0.994, train_loss=0.68, train_precision=0.898, train_recall=0.921] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.94      0.94       171
         LOC       0.65      0.74      0.69        27
         ORG       0.88      0.96      0.92       110
         PER       0.96      0.93      0.95       121

   micro avg       0.91      0.93      0.92       429
   macro avg       0.86      0.89      0.87       429
weighted avg       0.91      0.93      0.92       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.691, eval_acc=0.96, eval_loss=6.94, eval_precision=0.658, eval_recall=0.741] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.78      0.71      3160
         LOC       0.35      0.30      0.32       482
         ORG       0.48      0.55      0.51      1645
         PER       0.86      0.94      0.90      1650

   micro avg       0.64      0.73      0.68      6937
   macro avg       0.59      0.64      0.61      6937
weighted avg       0.64      0.73      0.68      6937



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.08it/s, F1=0.949, train_acc=0.997, train_loss=0.372, train_precision=0.947, train_recall=0.954]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       171
         LOC       0.93      0.93      0.93        27
         ORG       0.95      0.97      0.96       110
         PER       0.98      0.98      0.98       121

   micro avg       0.96      0.97      0.97       429
   macro avg       0.96      0.96      0.96       429
weighted avg       0.96      0.97      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.673, eval_acc=0.956, eval_loss=8.35, eval_precision=0.695, eval_recall=0.663]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.69      0.69      3160
         LOC       0.39      0.29      0.33       482
         ORG       0.50      0.47      0.48      1645
         PER       0.90      0.89      0.89      1650

   micro avg       0.68      0.66      0.67      6937
   macro avg       0.62      0.59      0.60      6937
weighted avg       0.67      0.66      0.66      6937



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.65it/s, F1=0.965, train_acc=0.998, train_loss=0.339, train_precision=0.959, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       171
         LOC       0.93      0.96      0.95        27
         ORG       0.93      0.95      0.94       110
         PER       0.97      0.99      0.98       121

   micro avg       0.96      0.97      0.97       429
   macro avg       0.95      0.97      0.96       429
weighted avg       0.96      0.97      0.97       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.00it/s, F1=0.676, eval_acc=0.957, eval_loss=8.24, eval_precision=0.646, eval_recall=0.719]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.80      0.72      3160
         LOC       0.32      0.41      0.36       482
         ORG       0.51      0.52      0.51      1645
         PER       0.88      0.84      0.86      1650

   micro avg       0.64      0.72      0.68      6937
   macro avg       0.59      0.64      0.61      6937
weighted avg       0.65      0.72      0.68      6937



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.66it/s, F1=0.95, train_acc=0.999, train_loss=0.206, train_precision=0.946, train_recall=0.954] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       171
         LOC       1.00      1.00      1.00        27
         ORG       0.95      0.96      0.95       110
         PER       0.98      0.99      0.98       121

   micro avg       0.97      0.98      0.98       429
   macro avg       0.98      0.98      0.98       429
weighted avg       0.97      0.98      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.674, eval_acc=0.959, eval_loss=7.84, eval_precision=0.614, eval_recall=0.76] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.81      0.71      3160
         LOC       0.33      0.43      0.37       482
         ORG       0.44      0.58      0.50      1645
         PER       0.87      0.90      0.88      1650

   micro avg       0.61      0.75      0.67      6937
   macro avg       0.57      0.68      0.62      6937
weighted avg       0.62      0.75      0.68      6937



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.997, train_acc=1, train_loss=0.0737, train_precision=0.995, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.99      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      1.00      0.99       429
   macro avg       0.99      1.00      1.00       429
weighted avg       0.99      1.00      0.99       429



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.37it/s, F1=0.692, eval_acc=0.96, eval_loss=8.81, eval_precision=0.67, eval_recall=0.726]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.81      0.72      3160
         LOC       0.47      0.31      0.38       482
         ORG       0.50      0.52      0.51      1645
         PER       0.87      0.88      0.88      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.62      0.63      0.62      6937
weighted avg       0.66      0.72      0.68      6937



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.67it/s, F1=0.947, train_acc=1, train_loss=0.0536, train_precision=0.947, train_recall=0.947]    


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       0.99      0.99      0.99       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.701, eval_acc=0.961, eval_loss=8.67, eval_precision=0.671, eval_recall=0.746]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.80      0.73      3160
         LOC       0.42      0.40      0.41       482
         ORG       0.51      0.56      0.53      1645
         PER       0.87      0.90      0.89      1650

   micro avg       0.66      0.74      0.70      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.66      0.74      0.70      6937



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.72it/s, F1=0.925, train_acc=0.999, train_loss=0.108, train_precision=0.92, train_recall=0.931]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       171
         LOC       0.87      0.96      0.91        27
         ORG       0.99      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       0.98      0.99      0.98       429
   macro avg       0.96      0.99      0.97       429
weighted avg       0.98      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.708, eval_acc=0.962, eval_loss=8.49, eval_precision=0.709, eval_recall=0.719]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.75      0.73      3160
         LOC       0.44      0.28      0.35       482
         ORG       0.55      0.59      0.57      1645
         PER       0.89      0.90      0.89      1650

   micro avg       0.70      0.72      0.71      6937
   macro avg       0.65      0.63      0.64      6937
weighted avg       0.70      0.72      0.70      6937



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.987, train_acc=0.999, train_loss=0.111, train_precision=0.99, train_recall=0.986]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       0.96      0.93      0.94        27
         ORG       0.99      0.99      0.99       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.99      0.98      0.98       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.692, eval_acc=0.961, eval_loss=8.37, eval_precision=0.656, eval_recall=0.744]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.63      0.82      0.71      3160
         LOC       0.42      0.31      0.36       482
         ORG       0.52      0.56      0.54      1645
         PER       0.88      0.89      0.88      1650

   micro avg       0.65      0.74      0.69      6937
   macro avg       0.61      0.65      0.62      6937
weighted avg       0.65      0.74      0.69      6937



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.05it/s, F1=0.999, train_acc=1, train_loss=0.0406, train_precision=1, train_recall=0.997]    


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      0.96      0.98        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      0.99      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.7, eval_acc=0.961, eval_loss=8.73, eval_precision=0.676, eval_recall=0.735]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.78      0.73      3160
         LOC       0.39      0.51      0.44       482
         ORG       0.54      0.54      0.54      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.67      0.73      0.70      6937
   macro avg       0.62      0.68      0.65      6937
weighted avg       0.68      0.73      0.70      6937



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.935, train_acc=0.999, train_loss=0.105, train_precision=0.939, train_recall=0.933]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       0.97      0.96      0.96       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.99      0.99      0.99       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.696, eval_acc=0.96, eval_loss=8.56, eval_precision=0.697, eval_recall=0.705] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.70      0.71      3160
         LOC       0.39      0.48      0.43       482
         ORG       0.56      0.56      0.56      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.69      0.70      0.69      6937
   macro avg       0.63      0.66      0.64      6937
weighted avg       0.69      0.70      0.70      6937



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.952, train_acc=0.998, train_loss=0.161, train_precision=0.955, train_recall=0.951]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.98      0.98       171
         LOC       0.90      0.96      0.93        27
         ORG       1.00      1.00      1.00       110
         PER       0.99      0.98      0.99       121

   micro avg       0.99      0.98      0.98       429
   macro avg       0.97      0.98      0.97       429
weighted avg       0.99      0.98      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.672, eval_acc=0.956, eval_loss=10.5, eval_precision=0.629, eval_recall=0.735]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.58      0.87      0.70      3160
         LOC       0.41      0.20      0.27       482
         ORG       0.53      0.46      0.49      1645
         PER       0.83      0.88      0.85      1650

   micro avg       0.62      0.73      0.67      6937
   macro avg       0.59      0.60      0.58      6937
weighted avg       0.62      0.73      0.66      6937



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.63it/s, F1=0.956, train_acc=0.999, train_loss=0.159, train_precision=0.955, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

         GPE       0.95      0.99      0.97       171
         LOC       1.00      0.89      0.94        27
         ORG       1.00      1.00      1.00       110
         PER       0.99      0.98      0.99       121

   micro avg       0.98      0.98      0.98       429
   macro avg       0.99      0.97      0.97       429
weighted avg       0.98      0.98      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.689, eval_acc=0.96, eval_loss=8.95, eval_precision=0.67, eval_recall=0.721]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.74      0.70      3160
         LOC       0.40      0.34      0.37       482
         ORG       0.53      0.58      0.56      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.66      0.71      0.69      6937
   macro avg       0.61      0.64      0.63      6937
weighted avg       0.66      0.71      0.69      6937



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.08it/s, F1=0.977, train_acc=0.999, train_loss=0.125, train_precision=0.977, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.98      0.99       171
         LOC       0.93      0.93      0.93        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.98      0.98      0.98       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.68, eval_acc=0.958, eval_loss=9.21, eval_precision=0.629, eval_recall=0.753] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.62      0.81      0.70      3160
         LOC       0.31      0.43      0.36       482
         ORG       0.51      0.56      0.53      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.62      0.75      0.68      6937
   macro avg       0.57      0.67      0.62      6937
weighted avg       0.62      0.75      0.68      6937



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.959, train_acc=0.999, train_loss=0.0826, train_precision=0.959, train_recall=0.96] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       171
         LOC       0.96      0.93      0.94        27
         ORG       1.00      1.00      1.00       110
         PER       0.98      0.98      0.98       121

   micro avg       0.99      0.99      0.99       429
   macro avg       0.98      0.98      0.98       429
weighted avg       0.99      0.99      0.99       429



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  4.00it/s, F1=0.701, eval_acc=0.961, eval_loss=9.04, eval_precision=0.674, eval_recall=0.742]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.75      0.73      3160
         LOC       0.32      0.54      0.40       482
         ORG       0.54      0.61      0.57      1645
         PER       0.85      0.90      0.88      1650

   micro avg       0.66      0.74      0.70      6937
   macro avg       0.61      0.70      0.64      6937
weighted avg       0.68      0.74      0.71      6937



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.76it/s, F1=0.955, train_acc=0.998, train_loss=0.348, train_precision=0.952, train_recall=0.961]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.95      0.96      0.95       110
         PER       0.98      1.00      0.99       121

   micro avg       0.97      0.99      0.98       429
   macro avg       0.98      0.99      0.98       429
weighted avg       0.97      0.99      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.66, eval_acc=0.95, eval_loss=13.1, eval_precision=0.66, eval_recall=0.671]   


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.79      0.72      3160
         LOC       0.38      0.49      0.43       482
         ORG       0.48      0.31      0.37      1645
         PER       0.87      0.87      0.87      1650

   micro avg       0.66      0.67      0.67      6937
   macro avg       0.60      0.61      0.60      6937
weighted avg       0.65      0.67      0.65      6937



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.68it/s, F1=0.977, train_acc=0.998, train_loss=0.281, train_precision=0.967, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       171
         LOC       1.00      1.00      1.00        27
         ORG       0.93      0.99      0.96       110
         PER       0.99      1.00      1.00       121

   micro avg       0.97      0.99      0.98       429
   macro avg       0.97      0.99      0.98       429
weighted avg       0.97      0.99      0.98       429



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.41it/s, F1=0.679, eval_acc=0.959, eval_loss=9.3, eval_precision=0.706, eval_recall=0.663] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.68      0.70      3160
         LOC       0.46      0.33      0.38       482
         ORG       0.52      0.48      0.50      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.70      0.66      0.68      6937
   macro avg       0.64      0.60      0.62      6937
weighted avg       0.69      0.66      0.67      6937



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.75it/s, F1=0.981, train_acc=0.999, train_loss=0.238, train_precision=0.983, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       0.93      0.96      0.95       110
         PER       0.99      0.98      0.99       121

   micro avg       0.97      0.98      0.98       429
   macro avg       0.98      0.98      0.98       429
weighted avg       0.97      0.98      0.98       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.699, eval_acc=0.961, eval_loss=8.67, eval_precision=0.667, eval_recall=0.745]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.79      0.72      3160
         LOC       0.46      0.46      0.46       482
         ORG       0.53      0.55      0.54      1645
         PER       0.85      0.90      0.87      1650

   micro avg       0.66      0.74      0.70      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.66      0.74      0.70      6937



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=0.968, train_acc=1, train_loss=0.0323, train_precision=0.968, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  3.97it/s, F1=0.704, eval_acc=0.961, eval_loss=9.42, eval_precision=0.687, eval_recall=0.733]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.77      0.73      3160
         LOC       0.41      0.46      0.43       482
         ORG       0.55      0.52      0.54      1645
         PER       0.86      0.92      0.89      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.68      0.73      0.70      6937



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.69it/s, F1=0.982, train_acc=1, train_loss=0.0416, train_precision=0.983, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       0.99      0.99      0.99       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.704, eval_acc=0.961, eval_loss=9.91, eval_precision=0.723, eval_recall=0.697]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.73      0.72      3160
         LOC       0.45      0.41      0.43       482
         ORG       0.57      0.52      0.54      1645
         PER       0.88      0.89      0.89      1650

   micro avg       0.71      0.69      0.70      6937
   macro avg       0.66      0.64      0.64      6937
weighted avg       0.70      0.69      0.70      6937



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.07it/s, F1=0.936, train_acc=1, train_loss=0.0499, train_precision=0.937, train_recall=0.935] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      0.99      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.707, eval_acc=0.962, eval_loss=9.21, eval_precision=0.679, eval_recall=0.749]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.77      0.73      3160
         LOC       0.42      0.49      0.45       482
         ORG       0.53      0.58      0.55      1645
         PER       0.85      0.94      0.89      1650

   micro avg       0.67      0.74      0.71      6937
   macro avg       0.62      0.69      0.66      6937
weighted avg       0.67      0.74      0.71      6937



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.73it/s, F1=0.936, train_acc=1, train_loss=0.0149, train_precision=0.936, train_recall=0.936] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.695, eval_acc=0.96, eval_loss=10.1, eval_precision=0.655, eval_recall=0.753] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.81      0.72      3160
         LOC       0.43      0.47      0.45       482
         ORG       0.52      0.54      0.53      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.65      0.75      0.69      6937
   macro avg       0.61      0.68      0.65      6937
weighted avg       0.65      0.75      0.69      6937



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.67it/s, F1=0.968, train_acc=1, train_loss=0.00688, train_precision=0.968, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.701, eval_acc=0.961, eval_loss=10.1, eval_precision=0.676, eval_recall=0.739]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72      3160
         LOC       0.43      0.47      0.45       482
         ORG       0.54      0.54      0.54      1645
         PER       0.86      0.92      0.89      1650

   micro avg       0.67      0.74      0.70      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.67      0.74      0.70      6937



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.71it/s, F1=1, train_acc=1, train_loss=0.00466, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.703, eval_acc=0.961, eval_loss=10.4, eval_precision=0.682, eval_recall=0.737]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.78      0.73      3160
         LOC       0.43      0.47      0.45       482
         ORG       0.54      0.53      0.53      1645
         PER       0.87      0.92      0.89      1650

   micro avg       0.67      0.73      0.70      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.67      0.73      0.70      6937



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:20<00:00,  3.05it/s, F1=0.984, train_acc=1, train_loss=0.00403, train_precision=0.984, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       171
         LOC       1.00      1.00      1.00        27
         ORG       1.00      1.00      1.00       110
         PER       1.00      1.00      1.00       121

   micro avg       1.00      1.00      1.00       429
   macro avg       1.00      1.00      1.00       429
weighted avg       1.00      1.00      1.00       429



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.705, eval_acc=0.961, eval_loss=10.5, eval_precision=0.685, eval_recall=0.736]


eval_reports:
              precision    recall  f1-score   support

         GPE       0.68      0.78      0.73      3160
         LOC       0.43      0.48      0.45       482
         ORG       0.54      0.53      0.54      1645
         PER       0.87      0.92      0.89      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.68      0.73      0.70      6937



calculate data/few_shot/note4/train_1000.json etag: 100%|██████████| 385k/385k [00:00<00:00, 15.5MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 335MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 374MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 189kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_1000.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_1000_x1"
}
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 154142.70L/s]
build line mapper: 19L [00:00, 159702.96L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5279.00it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 192595.59it/s]

load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding



load dataset from data/few_shot/note4/train_1000.json: 1000it [00:01, 837.07it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 568.68it/s]


Load pretrained embedding from file.........


Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of LEBertModel were not initialized from the model checkpoint at save_pretrained/note4_pretrain_l

train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.02      0.01       326
         LOC       0.00      0.00      0.00        55
         ORG       0.00      0.00      0.00       190
         PER       0.00      0.00      0.00       267

   micro avg       0.00      0.01      0.00       838
   macro avg       0.00      0.00      0.00       838
weighted avg       0.00      0.01      0.00       838



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  4.00it/s, F1=0.111, eval_acc=0.889, eval_loss=19.1, eval_precision=0.101, eval_recall=0.129] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.15      0.29      0.20      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.01      0.01      0.01      1650

   micro avg       0.11      0.14      0.12      6937
   macro avg       0.04      0.08      0.05      6937
weighted avg       0.07      0.14      0.09      6937



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.64it/s, F1=0.341, train_acc=0.952, train_loss=5.85, train_precision=0.316, train_recall=0.391]     


train_reports:
              precision    recall  f1-score   support

         GPE       0.34      0.50      0.41       326
         LOC       0.00      0.00      0.00        55
         ORG       0.31      0.33      0.32       190
         PER       0.30      0.48      0.37       267

   micro avg       0.32      0.42      0.36       838
   macro avg       0.24      0.33      0.27       838
weighted avg       0.30      0.42      0.35       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.539, eval_acc=0.952, eval_loss=7.82, eval_precision=0.476, eval_recall=0.631]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.50      0.72      0.59      3160
         LOC       0.01      0.01      0.01       482
         ORG       0.30      0.37      0.33      1645
         PER       0.76      0.87      0.81      1650

   micro avg       0.46      0.62      0.53      6937
   macro avg       0.39      0.49      0.44      6937
weighted avg       0.48      0.62      0.54      6937



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.64it/s, F1=0.645, train_acc=0.974, train_loss=2.83, train_precision=0.601, train_recall=0.72] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.70      0.81      0.75       326
         LOC       0.14      0.18      0.16        55
         ORG       0.52      0.71      0.60       190
         PER       0.66      0.78      0.71       267

   micro avg       0.60      0.74      0.66       838
   macro avg       0.50      0.62      0.55       838
weighted avg       0.61      0.74      0.66       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.654, eval_acc=0.958, eval_loss=7.02, eval_precision=0.615, eval_recall=0.711]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.73      0.70      3160
         LOC       0.11      0.03      0.05       482
         ORG       0.42      0.62      0.50      1645
         PER       0.78      0.93      0.85      1650

   micro avg       0.61      0.71      0.66      6937
   macro avg       0.50      0.58      0.53      6937
weighted avg       0.60      0.71      0.64      6937



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.34it/s, F1=0.794, train_acc=0.985, train_loss=1.63, train_precision=0.764, train_recall=0.845]


train_reports:
              precision    recall  f1-score   support

         GPE       0.84      0.90      0.87       326
         LOC       0.52      0.55      0.53        55
         ORG       0.66      0.81      0.73       190
         PER       0.79      0.92      0.85       267

   micro avg       0.76      0.86      0.81       838
   macro avg       0.70      0.79      0.74       838
weighted avg       0.76      0.86      0.81       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.679, eval_acc=0.959, eval_loss=7.29, eval_precision=0.645, eval_recall=0.726]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.76      0.71      3160
         LOC       0.18      0.23      0.20       482
         ORG       0.56      0.58      0.57      1645
         PER       0.82      0.93      0.87      1650

   micro avg       0.64      0.72      0.68      6937
   macro avg       0.56      0.62      0.59      6937
weighted avg       0.64      0.72      0.68      6937



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.64it/s, F1=0.872, train_acc=0.992, train_loss=0.952, train_precision=0.847, train_recall=0.913]


train_reports:
              precision    recall  f1-score   support

         GPE       0.89      0.94      0.92       326
         LOC       0.70      0.78      0.74        55
         ORG       0.80      0.89      0.84       190
         PER       0.89      0.96      0.93       267

   micro avg       0.86      0.93      0.89       838
   macro avg       0.82      0.89      0.86       838
weighted avg       0.86      0.93      0.89       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.672, eval_acc=0.961, eval_loss=7.04, eval_precision=0.643, eval_recall=0.711]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.74      0.72      3160
         LOC       0.22      0.33      0.27       482
         ORG       0.53      0.57      0.55      1645
         PER       0.82      0.90      0.86      1650

   micro avg       0.64      0.71      0.67      6937
   macro avg       0.56      0.63      0.60      6937
weighted avg       0.65      0.71      0.68      6937



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.63it/s, F1=0.881, train_acc=0.994, train_loss=0.628, train_precision=0.863, train_recall=0.909]


train_reports:
              precision    recall  f1-score   support

         GPE       0.91      0.95      0.93       326
         LOC       0.77      0.80      0.79        55
         ORG       0.86      0.93      0.89       190
         PER       0.92      0.97      0.94       267

   micro avg       0.89      0.94      0.92       838
   macro avg       0.86      0.91      0.89       838
weighted avg       0.89      0.94      0.92       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.41it/s, F1=0.687, eval_acc=0.961, eval_loss=8.46, eval_precision=0.665, eval_recall=0.722]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.74      0.73      3160
         LOC       0.27      0.38      0.31       482
         ORG       0.56      0.62      0.59      1645
         PER       0.83      0.88      0.86      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.68      0.72      0.70      6937



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.897, train_acc=0.996, train_loss=0.571, train_precision=0.885, train_recall=0.919]


train_reports:
              precision    recall  f1-score   support

         GPE       0.93      0.95      0.94       326
         LOC       0.89      0.89      0.89        55
         ORG       0.92      0.96      0.94       190
         PER       0.91      0.97      0.94       267

   micro avg       0.92      0.96      0.94       838
   macro avg       0.91      0.94      0.93       838
weighted avg       0.92      0.96      0.94       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.674, eval_acc=0.961, eval_loss=7.85, eval_precision=0.654, eval_recall=0.704]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.80      0.74      3160
         LOC       0.33      0.30      0.31       482
         ORG       0.48      0.50      0.49      1645
         PER       0.84      0.85      0.84      1650

   micro avg       0.65      0.70      0.68      6937
   macro avg       0.58      0.61      0.60      6937
weighted avg       0.65      0.70      0.67      6937



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.63it/s, F1=0.927, train_acc=0.997, train_loss=0.386, train_precision=0.915, train_recall=0.944]


train_reports:
              precision    recall  f1-score   support

         GPE       0.95      0.98      0.97       326
         LOC       0.86      0.87      0.86        55
         ORG       0.90      0.96      0.93       190
         PER       0.97      0.99      0.98       267

   micro avg       0.94      0.97      0.96       838
   macro avg       0.92      0.95      0.93       838
weighted avg       0.94      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.693, eval_acc=0.96, eval_loss=8.33, eval_precision=0.658, eval_recall=0.743] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.77      0.75      3160
         LOC       0.28      0.40      0.33       482
         ORG       0.53      0.62      0.58      1645
         PER       0.81      0.92      0.86      1650

   micro avg       0.66      0.75      0.70      6937
   macro avg       0.59      0.68      0.63      6937
weighted avg       0.67      0.75      0.70      6937



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.36it/s, F1=0.939, train_acc=0.998, train_loss=0.213, train_precision=0.935, train_recall=0.944]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       326
         LOC       0.94      0.93      0.94        55
         ORG       0.95      0.98      0.97       190
         PER       0.98      0.98      0.98       267

   micro avg       0.97      0.98      0.97       838
   macro avg       0.96      0.97      0.96       838
weighted avg       0.97      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.673, eval_acc=0.957, eval_loss=9.21, eval_precision=0.616, eval_recall=0.753]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.80      0.72      3160
         LOC       0.26      0.44      0.33       482
         ORG       0.50      0.58      0.54      1645
         PER       0.83      0.92      0.87      1650

   micro avg       0.62      0.75      0.68      6937
   macro avg       0.56      0.69      0.61      6937
weighted avg       0.63      0.75      0.68      6937



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.947, train_acc=0.999, train_loss=0.235, train_precision=0.94, train_recall=0.958] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       326
         LOC       0.83      0.89      0.86        55
         ORG       0.97      0.99      0.98       190
         PER       0.97      0.99      0.98       267

   micro avg       0.96      0.98      0.97       838
   macro avg       0.94      0.96      0.95       838
weighted avg       0.96      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.699, eval_acc=0.961, eval_loss=9.61, eval_precision=0.687, eval_recall=0.721]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.79      0.75      3160
         LOC       0.33      0.39      0.36       482
         ORG       0.56      0.53      0.54      1645
         PER       0.84      0.89      0.86      1650

   micro avg       0.68      0.72      0.70      6937
   macro avg       0.61      0.65      0.63      6937
weighted avg       0.68      0.72      0.70      6937



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.971, train_acc=0.999, train_loss=0.176, train_precision=0.968, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.93      0.98      0.96        55
         ORG       0.96      0.97      0.97       190
         PER       0.98      0.99      0.99       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.97      0.98      0.98       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.04it/s, F1=0.708, eval_acc=0.962, eval_loss=9.08, eval_precision=0.678, eval_recall=0.751]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.79      0.76      3160
         LOC       0.34      0.40      0.37       482
         ORG       0.56      0.62      0.59      1645
         PER       0.78      0.92      0.84      1650

   micro avg       0.68      0.75      0.71      6937
   macro avg       0.61      0.68      0.64      6937
weighted avg       0.68      0.75      0.71      6937



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.65it/s, F1=0.936, train_acc=0.997, train_loss=0.371, train_precision=0.929, train_recall=0.947]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       0.90      0.95      0.92        55
         ORG       0.90      0.95      0.92       190
         PER       0.98      0.99      0.99       267

   micro avg       0.96      0.98      0.97       838
   macro avg       0.94      0.97      0.96       838
weighted avg       0.96      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.704, eval_acc=0.961, eval_loss=9.28, eval_precision=0.68, eval_recall=0.741] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.79      0.75      3160
         LOC       0.37      0.34      0.35       482
         ORG       0.54      0.61      0.57      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.62      0.66      0.64      6937
weighted avg       0.68      0.74      0.71      6937



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.938, train_acc=0.999, train_loss=0.146, train_precision=0.934, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       326
         LOC       0.96      0.96      0.96        55
         ORG       0.95      0.98      0.96       190
         PER       0.99      0.99      0.99       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.97      0.98      0.98       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.68, eval_acc=0.958, eval_loss=9.87, eval_precision=0.665, eval_recall=0.709] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.68      0.70      3160
         LOC       0.27      0.40      0.32       482
         ORG       0.54      0.65      0.59      1645
         PER       0.86      0.87      0.87      1650

   micro avg       0.66      0.70      0.68      6937
   macro avg       0.60      0.65      0.62      6937
weighted avg       0.68      0.70      0.69      6937



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.954, train_acc=0.998, train_loss=0.252, train_precision=0.95, train_recall=0.959] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       0.98      0.98      0.98        55
         ORG       0.95      0.98      0.97       190
         PER       1.00      1.00      1.00       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.691, eval_acc=0.957, eval_loss=9.74, eval_precision=0.654, eval_recall=0.745]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.76      0.74      3160
         LOC       0.33      0.38      0.35       482
         ORG       0.50      0.66      0.57      1645
         PER       0.84      0.90      0.86      1650

   micro avg       0.66      0.74      0.70      6937
   macro avg       0.60      0.67      0.63      6937
weighted avg       0.67      0.74      0.70      6937



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.65it/s, F1=0.94, train_acc=0.999, train_loss=0.174, train_precision=0.938, train_recall=0.945] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       326
         LOC       0.98      0.96      0.97        55
         ORG       0.96      0.97      0.97       190
         PER       0.99      0.99      0.99       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.694, eval_acc=0.96, eval_loss=9.57, eval_precision=0.655, eval_recall=0.749] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.78      0.76      3160
         LOC       0.25      0.45      0.32       482
         ORG       0.56      0.59      0.57      1645
         PER       0.80      0.92      0.85      1650

   micro avg       0.66      0.75      0.70      6937
   macro avg       0.58      0.69      0.63      6937
weighted avg       0.67      0.75      0.71      6937



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.35it/s, F1=0.989, train_acc=1, train_loss=0.0535, train_precision=0.987, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       0.98      1.00      0.99        55
         ORG       0.98      0.99      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      0.99       838
   macro avg       0.99      1.00      0.99       838
weighted avg       0.99      1.00      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.715, eval_acc=0.963, eval_loss=10.4, eval_precision=0.703, eval_recall=0.738]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.80      0.76      3160
         LOC       0.38      0.35      0.37       482
         ORG       0.62      0.59      0.61      1645
         PER       0.83      0.88      0.86      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.64      0.66      0.65      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.65it/s, F1=0.956, train_acc=1, train_loss=0.087, train_precision=0.957, train_recall=0.955]    


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.99      1.00       326
         LOC       0.96      0.95      0.95        55
         ORG       0.99      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      0.99      0.99       838
   macro avg       0.99      0.98      0.99       838
weighted avg       1.00      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.02it/s, F1=0.712, eval_acc=0.962, eval_loss=10.2, eval_precision=0.686, eval_recall=0.748]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.80      0.75      3160
         LOC       0.30      0.43      0.35       482
         ORG       0.62      0.61      0.62      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.69      0.75      0.72      6937
   macro avg       0.62      0.68      0.65      6937
weighted avg       0.70      0.75      0.72      6937



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.968, train_acc=0.999, train_loss=0.0542, train_precision=0.969, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.95      0.95      0.95        55
         ORG       0.99      0.99      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.43it/s, F1=0.703, eval_acc=0.961, eval_loss=11.3, eval_precision=0.691, eval_recall=0.725]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.76      0.75      3160
         LOC       0.30      0.44      0.35       482
         ORG       0.58      0.55      0.57      1645
         PER       0.85      0.90      0.87      1650

   micro avg       0.68      0.72      0.70      6937
   macro avg       0.61      0.66      0.64      6937
weighted avg       0.69      0.72      0.71      6937



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.64it/s, F1=0.95, train_acc=0.998, train_loss=0.299, train_precision=0.945, train_recall=0.957] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       326
         LOC       0.95      0.95      0.95        55
         ORG       0.95      0.96      0.95       190
         PER       0.98      0.99      0.99       267

   micro avg       0.97      0.98      0.97       838
   macro avg       0.96      0.97      0.97       838
weighted avg       0.97      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.703, eval_acc=0.962, eval_loss=8.78, eval_precision=0.699, eval_recall=0.72] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.75      0.76      3160
         LOC       0.39      0.37      0.38       482
         ORG       0.50      0.65      0.57      1645
         PER       0.89      0.86      0.87      1650

   micro avg       0.69      0.72      0.71      6937
   macro avg       0.64      0.66      0.64      6937
weighted avg       0.71      0.72      0.71      6937



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.64it/s, F1=0.959, train_acc=0.998, train_loss=0.32, train_precision=0.956, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       326
         LOC       1.00      0.96      0.98        55
         ORG       0.93      0.97      0.95       190
         PER       0.99      0.99      0.99       267

   micro avg       0.97      0.98      0.97       838
   macro avg       0.97      0.97      0.97       838
weighted avg       0.97      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.703, eval_acc=0.961, eval_loss=10.1, eval_precision=0.691, eval_recall=0.723]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.73      0.74      3160
         LOC       0.30      0.42      0.35       482
         ORG       0.56      0.65      0.60      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.69      0.73      0.71      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.71      0.73      0.71      6937



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.972, train_acc=0.999, train_loss=0.191, train_precision=0.968, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       326
         LOC       0.95      0.95      0.95        55
         ORG       0.95      0.98      0.97       190
         PER       1.00      1.00      1.00       267

   micro avg       0.97      0.98      0.98       838
   macro avg       0.97      0.98      0.97       838
weighted avg       0.97      0.98      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.682, eval_acc=0.958, eval_loss=10.5, eval_precision=0.647, eval_recall=0.731]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.81      0.72      3160
         LOC       0.26      0.40      0.32       482
         ORG       0.58      0.53      0.56      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.65      0.73      0.69      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.953, train_acc=0.999, train_loss=0.154, train_precision=0.95, train_recall=0.957] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       326
         LOC       0.96      0.98      0.97        55
         ORG       0.99      1.00      1.00       190
         PER       0.99      1.00      0.99       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.98      0.99      0.99       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.704, eval_acc=0.961, eval_loss=10.8, eval_precision=0.688, eval_recall=0.731]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.76      0.74      3160
         LOC       0.36      0.39      0.37       482
         ORG       0.58      0.59      0.58      1645
         PER       0.83      0.91      0.87      1650

   micro avg       0.69      0.73      0.71      6937
   macro avg       0.62      0.66      0.64      6937
weighted avg       0.69      0.73      0.71      6937



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.65it/s, F1=0.988, train_acc=1, train_loss=0.0647, train_precision=0.986, train_recall=0.99]    


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       1.00      1.00      1.00        55
         ORG       1.00      1.00      1.00       190
         PER       0.99      1.00      0.99       267

   micro avg       0.99      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       0.99      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.40it/s, F1=0.71, eval_acc=0.962, eval_loss=11, eval_precision=0.692, eval_recall=0.737]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.79      0.75      3160
         LOC       0.39      0.39      0.39       482
         ORG       0.58      0.58      0.58      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.69      0.74      0.72      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.69      0.74      0.71      6937



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.983, train_acc=1, train_loss=0.02, train_precision=0.983, train_recall=0.984]  


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.02it/s, F1=0.715, eval_acc=0.962, eval_loss=11.9, eval_precision=0.705, eval_recall=0.735]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.78      0.76      3160
         LOC       0.37      0.43      0.40       482
         ORG       0.60      0.57      0.58      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.64      0.67      0.65      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.69it/s, F1=0.96, train_acc=1, train_loss=0.00816, train_precision=0.96, train_recall=0.96]   


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.709, eval_acc=0.961, eval_loss=12.4, eval_precision=0.695, eval_recall=0.733]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.77      0.76      3160
         LOC       0.32      0.48      0.38       482
         ORG       0.59      0.57      0.58      1645
         PER       0.85      0.90      0.88      1650

   micro avg       0.69      0.73      0.71      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.70      0.73      0.72      6937



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.36it/s, F1=1, train_acc=1, train_loss=0.00606, train_precision=0.999, train_recall=1]   


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  3.98it/s, F1=0.711, eval_acc=0.961, eval_loss=12.6, eval_precision=0.694, eval_recall=0.738]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.78      0.76      3160
         LOC       0.32      0.47      0.38       482
         ORG       0.59      0.57      0.58      1645
         PER       0.85      0.90      0.88      1650

   micro avg       0.69      0.74      0.72      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.61it/s, F1=0.988, train_acc=1, train_loss=0.0256, train_precision=0.987, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      0.99      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.706, eval_acc=0.96, eval_loss=12.3, eval_precision=0.674, eval_recall=0.75]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.82      0.74      3160
         LOC       0.37      0.26      0.31       482
         ORG       0.54      0.59      0.57      1645
         PER       0.87      0.91      0.88      1650

   micro avg       0.67      0.75      0.71      6937
   macro avg       0.61      0.65      0.62      6937
weighted avg       0.67      0.75      0.70      6937



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.973, train_acc=1, train_loss=0.0349, train_precision=0.973, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       0.96      0.96      0.96        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       0.99      0.99      0.99       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.40it/s, F1=0.702, eval_acc=0.96, eval_loss=13.2, eval_precision=0.685, eval_recall=0.729] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.78      0.74      3160
         LOC       0.27      0.40      0.32       482
         ORG       0.60      0.53      0.56      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.61      0.66      0.63      6937
weighted avg       0.69      0.73      0.70      6937



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.973, train_acc=1, train_loss=0.0143, train_precision=0.972, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       326
         LOC       0.95      0.98      0.96        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      1.00       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.99      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.712, eval_acc=0.961, eval_loss=13, eval_precision=0.701, eval_recall=0.732]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.74      0.75      3160
         LOC       0.27      0.42      0.33       482
         ORG       0.60      0.62      0.61      1645
         PER       0.88      0.91      0.89      1650

   micro avg       0.70      0.73      0.71      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.72      0.73      0.72      6937



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.984, train_acc=1, train_loss=0.0415, train_precision=0.984, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      0.98      0.99        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.40it/s, F1=0.708, eval_acc=0.96, eval_loss=12.5, eval_precision=0.682, eval_recall=0.746] 


eval_reports:
              precision    recall  f1-score   support

         GPE       0.75      0.78      0.76      3160
         LOC       0.25      0.42      0.31       482
         ORG       0.57      0.61      0.59      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.61      0.68      0.64      6937
weighted avg       0.70      0.74      0.72      6937



calculate data/few_shot/note4/train_1000.json etag: 100%|██████████| 385k/385k [00:00<00:00, 287MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 332MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 372MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 192kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_1000.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_1000_x2"
}
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 150931.39L/s]
build line mapper: 19L [00:00, 162636.28L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5735.28it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 184590.40it/s]
load dataset from data/few_shot/note4/train_1000.json: 0it [00:00, ?it/s]

load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_1000.json: 1000it [00:01, 580.23it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:10, 394.94it/s]


Load pretrained embedding from file.........


Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of LEBertModel were not initialized from the model checkpoint at save_pretrained/note4_pretrain_l

train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.00      0.00       326
         LOC       0.00      0.00      0.00        55
         ORG       0.00      0.00      0.00       190
         PER       0.00      0.00      0.00       267
           _       0.00      0.00      0.00         0

   micro avg       0.00      0.00      0.00       838
   macro avg       0.00      0.00      0.00       838
weighted avg       0.00      0.00      0.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.00132, eval_acc=0.899, eval_loss=14, eval_precision=0.00313, eval_recall=0.000896]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.01      0.00      0.00      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.00      0.00      0.00      1650

   micro avg       0.00      0.00      0.00      6937
   macro avg       0.00      0.00      0.00      6937
weighted avg       0.00      0.00      0.00      6937



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.62it/s, F1=0.393, train_acc=0.953, train_loss=4.64, train_precision=0.4, train_recall=0.414]       


train_reports:
              precision    recall  f1-score   support

         GPE       0.44      0.53      0.48       326
         LOC       0.00      0.00      0.00        55
         ORG       0.38      0.34      0.36       190
         PER       0.46      0.58      0.51       267

   micro avg       0.43      0.47      0.45       838
   macro avg       0.32      0.36      0.34       838
weighted avg       0.40      0.47      0.43       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.65, eval_acc=0.955, eval_loss=5.83, eval_precision=0.667, eval_recall=0.645] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.71      0.69      3160
         LOC       0.20      0.12      0.15       482
         ORG       0.49      0.41      0.45      1645
         PER       0.83      0.87      0.85      1650

   micro avg       0.66      0.64      0.65      6937
   macro avg       0.55      0.53      0.54      6937
weighted avg       0.63      0.64      0.63      6937



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.733, train_acc=0.978, train_loss=2.11, train_precision=0.723, train_recall=0.765]


train_reports:
              precision    recall  f1-score   support

         GPE       0.76      0.83      0.79       326
         LOC       0.41      0.40      0.40        55
         ORG       0.58      0.65      0.61       190
         PER       0.87      0.91      0.89       267

   micro avg       0.73      0.79      0.76       838
   macro avg       0.65      0.70      0.67       838
weighted avg       0.73      0.79      0.76       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.662, eval_acc=0.957, eval_loss=5.73, eval_precision=0.594, eval_recall=0.758]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.80      0.73      3160
         LOC       0.22      0.44      0.29       482
         ORG       0.43      0.61      0.50      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.59      0.76      0.67      6937
   macro avg       0.55      0.69      0.60      6937
weighted avg       0.63      0.76      0.68      6937



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.84, train_acc=0.988, train_loss=1.15, train_precision=0.822, train_recall=0.877] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.83      0.90      0.86       326
         LOC       0.50      0.55      0.52        55
         ORG       0.78      0.88      0.83       190
         PER       0.91      0.96      0.93       267

   micro avg       0.82      0.89      0.85       838
   macro avg       0.76      0.82      0.79       838
weighted avg       0.82      0.89      0.85       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.686, eval_acc=0.961, eval_loss=6.58, eval_precision=0.718, eval_recall=0.666]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.69      0.70      3160
         LOC       0.37      0.28      0.32       482
         ORG       0.60      0.53      0.57      1645
         PER       0.85      0.87      0.86      1650

   micro avg       0.71      0.67      0.69      6937
   macro avg       0.64      0.59      0.61      6937
weighted avg       0.70      0.67      0.68      6937



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.32it/s, F1=0.87, train_acc=0.993, train_loss=0.719, train_precision=0.858, train_recall=0.889] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.91      0.94      0.93       326
         LOC       0.64      0.67      0.65        55
         ORG       0.89      0.96      0.92       190
         PER       0.94      0.96      0.95       267

   micro avg       0.90      0.93      0.92       838
   macro avg       0.85      0.88      0.86       838
weighted avg       0.90      0.93      0.92       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.704, eval_acc=0.963, eval_loss=6.39, eval_precision=0.703, eval_recall=0.716]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.76      0.74      3160
         LOC       0.34      0.29      0.31       482
         ORG       0.59      0.56      0.57      1645
         PER       0.83      0.90      0.87      1650

   micro avg       0.70      0.71      0.71      6937
   macro avg       0.62      0.63      0.62      6937
weighted avg       0.69      0.71      0.70      6937



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.914, train_acc=0.995, train_loss=0.591, train_precision=0.91, train_recall=0.926] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.95      0.95       326
         LOC       0.73      0.80      0.77        55
         ORG       0.90      0.94      0.92       190
         PER       0.96      0.97      0.96       267

   micro avg       0.92      0.95      0.94       838
   macro avg       0.88      0.92      0.90       838
weighted avg       0.92      0.95      0.94       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.694, eval_acc=0.961, eval_loss=6.9, eval_precision=0.681, eval_recall=0.718] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.78      0.74      3160
         LOC       0.32      0.25      0.28       482
         ORG       0.55      0.56      0.55      1645
         PER       0.82      0.89      0.85      1650

   micro avg       0.68      0.72      0.70      6937
   macro avg       0.60      0.62      0.61      6937
weighted avg       0.67      0.72      0.69      6937



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.63it/s, F1=0.919, train_acc=0.997, train_loss=0.379, train_precision=0.906, train_recall=0.936]


train_reports:
              precision    recall  f1-score   support

         GPE       0.95      0.98      0.96       326
         LOC       0.93      0.91      0.92        55
         ORG       0.91      0.97      0.94       190
         PER       0.96      0.99      0.98       267

   micro avg       0.94      0.97      0.96       838
   macro avg       0.94      0.96      0.95       838
weighted avg       0.94      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.02it/s, F1=0.69, eval_acc=0.959, eval_loss=8.73, eval_precision=0.743, eval_recall=0.657] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.68      0.72      3160
         LOC       0.37      0.28      0.32       482
         ORG       0.64      0.49      0.56      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.73      0.66      0.69      6937
   macro avg       0.65      0.58      0.61      6937
weighted avg       0.72      0.66      0.69      6937



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.29it/s, F1=0.924, train_acc=0.995, train_loss=0.432, train_precision=0.922, train_recall=0.934]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       0.91      0.95      0.93        55
         ORG       0.87      0.92      0.89       190
         PER       0.99      0.99      0.99       267

   micro avg       0.95      0.97      0.96       838
   macro avg       0.94      0.96      0.95       838
weighted avg       0.95      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.696, eval_acc=0.961, eval_loss=7.23, eval_precision=0.703, eval_recall=0.7]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.72      0.73      3160
         LOC       0.32      0.37      0.34       482
         ORG       0.61      0.58      0.59      1645
         PER       0.83      0.89      0.86      1650

   micro avg       0.70      0.70      0.70      6937
   macro avg       0.62      0.64      0.63      6937
weighted avg       0.70      0.70      0.70      6937



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.975, train_acc=0.999, train_loss=0.133, train_precision=0.969, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       0.96      0.98      0.97        55
         ORG       0.95      0.98      0.97       190
         PER       0.98      1.00      0.99       267

   micro avg       0.97      0.99      0.98       838
   macro avg       0.97      0.99      0.98       838
weighted avg       0.97      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.699, eval_acc=0.96, eval_loss=7.9, eval_precision=0.661, eval_recall=0.752]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.80      0.74      3160
         LOC       0.33      0.32      0.32       482
         ORG       0.53      0.63      0.58      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.66      0.75      0.70      6937
   macro avg       0.59      0.66      0.63      6937
weighted avg       0.66      0.75      0.70      6937



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.938, train_acc=0.999, train_loss=0.12, train_precision=0.935, train_recall=0.942] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.91      0.95      0.93        55
         ORG       0.98      0.99      0.99       190
         PER       0.99      1.00      0.99       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.97      0.98      0.98       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.717, eval_acc=0.962, eval_loss=8.2, eval_precision=0.695, eval_recall=0.751] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.80      0.75      3160
         LOC       0.37      0.27      0.31       482
         ORG       0.57      0.63      0.60      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.69      0.75      0.72      6937
   macro avg       0.62      0.65      0.63      6937
weighted avg       0.68      0.75      0.71      6937



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.971, train_acc=0.999, train_loss=0.143, train_precision=0.97, train_recall=0.974]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       326
         LOC       0.96      0.98      0.97        55
         ORG       0.97      0.97      0.97       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.98      0.99      0.98       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.643, eval_acc=0.943, eval_loss=10.2, eval_precision=0.56, eval_recall=0.774] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.75      0.73      3160
         LOC       0.25      0.43      0.31       482
         ORG       0.37      0.74      0.50      1645
         PER       0.76      0.92      0.83      1650

   micro avg       0.56      0.76      0.65      6937
   macro avg       0.52      0.71      0.59      6937
weighted avg       0.61      0.76      0.67      6937



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.924, train_acc=0.996, train_loss=0.419, train_precision=0.918, train_recall=0.934]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       326
         LOC       0.93      0.93      0.93        55
         ORG       0.86      0.93      0.89       190
         PER       0.98      0.99      0.99       267

   micro avg       0.94      0.97      0.96       838
   macro avg       0.93      0.96      0.95       838
weighted avg       0.94      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.43it/s, F1=0.674, eval_acc=0.958, eval_loss=8.85, eval_precision=0.658, eval_recall=0.699]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.69      0.71      3160
         LOC       0.25      0.47      0.33       482
         ORG       0.57      0.58      0.58      1645
         PER       0.83      0.91      0.87      1650

   micro avg       0.66      0.70      0.68      6937
   macro avg       0.59      0.66      0.62      6937
weighted avg       0.68      0.70      0.69      6937



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.69it/s, F1=0.957, train_acc=0.999, train_loss=0.195, train_precision=0.952, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       0.91      0.96      0.94        55
         ORG       0.95      0.97      0.96       190
         PER       0.99      0.99      0.99       267

   micro avg       0.97      0.98      0.98       838
   macro avg       0.96      0.98      0.97       838
weighted avg       0.97      0.98      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.708, eval_acc=0.961, eval_loss=8.08, eval_precision=0.675, eval_recall=0.756]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.83      0.75      3160
         LOC       0.37      0.35      0.36       482
         ORG       0.55      0.61      0.58      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.968, train_acc=0.999, train_loss=0.1, train_precision=0.966, train_recall=0.972]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       0.96      0.96      0.96        55
         ORG       0.97      0.98      0.98       190
         PER       0.99      0.99      0.99       267

   micro avg       0.98      0.98      0.98       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.98      0.98      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.708, eval_acc=0.961, eval_loss=8.95, eval_precision=0.706, eval_recall=0.721]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.74      0.74      3160
         LOC       0.35      0.35      0.35       482
         ORG       0.58      0.62      0.60      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.70      0.72      0.71      6937
   macro avg       0.63      0.65      0.64      6937
weighted avg       0.70      0.72      0.71      6937



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.974, train_acc=1, train_loss=0.025, train_precision=0.974, train_recall=0.974]    


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       0.98      0.98      0.98        55
         ORG       1.00      0.99      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       0.99      0.99      0.99       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.708, eval_acc=0.961, eval_loss=9.41, eval_precision=0.694, eval_recall=0.732]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.75      0.74      3160
         LOC       0.36      0.45      0.40       482
         ORG       0.57      0.62      0.59      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.69      0.73      0.71      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.70      0.73      0.71      6937



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.68it/s, F1=0.975, train_acc=1, train_loss=0.0226, train_precision=0.975, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      0.99      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.712, eval_acc=0.962, eval_loss=9.83, eval_precision=0.713, eval_recall=0.721]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.74      0.75      3160
         LOC       0.37      0.43      0.40       482
         ORG       0.59      0.60      0.60      1645
         PER       0.88      0.88      0.88      1650

   micro avg       0.71      0.72      0.72      6937
   macro avg       0.65      0.67      0.66      6937
weighted avg       0.72      0.72      0.72      6937



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.968, train_acc=1, train_loss=0.00892, train_precision=0.968, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.712, eval_acc=0.962, eval_loss=10.6, eval_precision=0.713, eval_recall=0.722]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.75      0.74      3160
         LOC       0.41      0.40      0.41       482
         ORG       0.60      0.60      0.60      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.71      0.72      0.72      6937
   macro avg       0.65      0.66      0.66      6937
weighted avg       0.71      0.72      0.72      6937



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.36it/s, F1=0.988, train_acc=0.999, train_loss=0.0648, train_precision=0.988, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.98      0.99      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.711, eval_acc=0.962, eval_loss=9.28, eval_precision=0.718, eval_recall=0.716]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.73      0.74      3160
         LOC       0.41      0.42      0.42       482
         ORG       0.59      0.60      0.59      1645
         PER       0.88      0.88      0.88      1650

   micro avg       0.72      0.72      0.72      6937
   macro avg       0.66      0.66      0.66      6937
weighted avg       0.72      0.72      0.72      6937



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.975, train_acc=1, train_loss=0.0591, train_precision=0.975, train_recall=0.976]    


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.96      0.96      0.96        55
         ORG       0.99      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      0.99       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.99      1.00      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.708, eval_acc=0.961, eval_loss=9.17, eval_precision=0.676, eval_recall=0.754]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.79      0.74      3160
         LOC       0.36      0.44      0.39       482
         ORG       0.56      0.62      0.59      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.68      0.75      0.71      6937
   macro avg       0.62      0.69      0.65      6937
weighted avg       0.68      0.75      0.71      6937



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.30it/s, F1=0.947, train_acc=0.999, train_loss=0.145, train_precision=0.945, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       326
         LOC       0.93      0.96      0.95        55
         ORG       0.97      0.99      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.97      0.99      0.98       838
   macro avg       0.97      0.98      0.97       838
weighted avg       0.97      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.68, eval_acc=0.96, eval_loss=9.44, eval_precision=0.69, eval_recall=0.684]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.73      0.71      3160
         LOC       0.46      0.35      0.40       482
         ORG       0.58      0.47      0.52      1645
         PER       0.79      0.90      0.84      1650

   micro avg       0.69      0.68      0.68      6937
   macro avg       0.63      0.61      0.62      6937
weighted avg       0.67      0.68      0.68      6937



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.937, train_acc=0.999, train_loss=0.134, train_precision=0.935, train_recall=0.94] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       326
         LOC       0.93      0.96      0.95        55
         ORG       0.97      0.98      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.97      0.98      0.97       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.717, eval_acc=0.961, eval_loss=9.61, eval_precision=0.732, eval_recall=0.717]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.71      0.72      3160
         LOC       0.47      0.35      0.40       482
         ORG       0.61      0.63      0.62      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.72      0.71      0.72      6937
   macro avg       0.67      0.65      0.66      6937
weighted avg       0.72      0.71      0.71      6937



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.951, train_acc=0.998, train_loss=0.271, train_precision=0.949, train_recall=0.959]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       0.98      1.00      0.99        55
         ORG       0.94      0.97      0.96       190
         PER       0.97      0.98      0.97       267

   micro avg       0.97      0.99      0.98       838
   macro avg       0.97      0.99      0.98       838
weighted avg       0.97      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.69, eval_acc=0.957, eval_loss=11.3, eval_precision=0.76, eval_recall=0.643]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.64      0.70      3160
         LOC       0.49      0.36      0.41       482
         ORG       0.63      0.48      0.55      1645
         PER       0.88      0.87      0.87      1650

   micro avg       0.75      0.64      0.69      6937
   macro avg       0.69      0.59      0.63      6937
weighted avg       0.74      0.64      0.69      6937



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.947, train_acc=0.997, train_loss=0.446, train_precision=0.945, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       1.00      1.00      1.00        55
         ORG       0.92      0.96      0.94       190
         PER       0.97      0.99      0.98       267

   micro avg       0.96      0.98      0.97       838
   macro avg       0.97      0.98      0.97       838
weighted avg       0.96      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.703, eval_acc=0.961, eval_loss=10.4, eval_precision=0.735, eval_recall=0.684]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.71      0.72      3160
         LOC       0.42      0.35      0.38       482
         ORG       0.65      0.54      0.59      1645
         PER       0.87      0.87      0.87      1650

   micro avg       0.73      0.68      0.71      6937
   macro avg       0.67      0.62      0.64      6937
weighted avg       0.72      0.68      0.70      6937



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.63it/s, F1=0.963, train_acc=0.998, train_loss=0.211, train_precision=0.959, train_recall=0.97] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       0.93      0.96      0.95        55
         ORG       0.95      0.97      0.96       190
         PER       0.98      0.98      0.98       267

   micro avg       0.97      0.98      0.98       838
   macro avg       0.96      0.98      0.97       838
weighted avg       0.97      0.98      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.697, eval_acc=0.96, eval_loss=9.38, eval_precision=0.714, eval_recall=0.693] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.78      0.66      0.72      3160
         LOC       0.39      0.38      0.38       482
         ORG       0.55      0.64      0.59      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.71      0.69      0.70      6937
   macro avg       0.65      0.64      0.64      6937
weighted avg       0.72      0.69      0.70      6937



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.978, train_acc=1, train_loss=0.0554, train_precision=0.976, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      0.99      0.99       190
         PER       0.99      0.99      0.99       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.99      1.00      0.99       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.722, eval_acc=0.962, eval_loss=9.67, eval_precision=0.74, eval_recall=0.714] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.73      0.75      3160
         LOC       0.43      0.40      0.42       482
         ORG       0.64      0.59      0.61      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.74      0.71      0.72      6937
   macro avg       0.67      0.65      0.66      6937
weighted avg       0.73      0.71      0.72      6937



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.982, train_acc=1, train_loss=0.0231, train_precision=0.982, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      0.99      0.99       190
         PER       0.99      1.00      0.99       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.725, eval_acc=0.962, eval_loss=10.2, eval_precision=0.738, eval_recall=0.722]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.75      0.76      3160
         LOC       0.40      0.42      0.41       482
         ORG       0.64      0.61      0.62      1645
         PER       0.88      0.87      0.88      1650

   micro avg       0.74      0.72      0.73      6937
   macro avg       0.67      0.66      0.67      6937
weighted avg       0.74      0.72      0.73      6937



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.94, train_acc=0.999, train_loss=0.121, train_precision=0.941, train_recall=0.942] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.95      0.96      0.95        55
         ORG       0.98      0.98      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.712, eval_acc=0.961, eval_loss=9.92, eval_precision=0.725, eval_recall=0.709]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.71      0.73      3160
         LOC       0.41      0.39      0.40       482
         ORG       0.61      0.62      0.62      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.72      0.71      0.71      6937
   macro avg       0.66      0.65      0.65      6937
weighted avg       0.72      0.71      0.71      6937



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.30it/s, F1=0.974, train_acc=0.998, train_loss=0.246, train_precision=0.974, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       326
         LOC       0.95      0.96      0.95        55
         ORG       0.96      0.96      0.96       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.702, eval_acc=0.961, eval_loss=9.04, eval_precision=0.707, eval_recall=0.707]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.70      0.72      3160
         LOC       0.38      0.44      0.41       482
         ORG       0.58      0.63      0.60      1645
         PER       0.85      0.88      0.87      1650

   micro avg       0.70      0.71      0.70      6937
   macro avg       0.64      0.66      0.65      6937
weighted avg       0.71      0.71      0.71      6937



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.967, train_acc=0.999, train_loss=0.105, train_precision=0.968, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.95      0.96      0.95        55
         ORG       0.99      0.98      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.04it/s, F1=0.712, eval_acc=0.962, eval_loss=10.4, eval_precision=0.713, eval_recall=0.719]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.77      0.75      3160
         LOC       0.39      0.35      0.37       482
         ORG       0.60      0.56      0.58      1645
         PER       0.85      0.88      0.87      1650

   micro avg       0.71      0.72      0.71      6937
   macro avg       0.64      0.64      0.64      6937
weighted avg       0.70      0.72      0.71      6937



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.37it/s, F1=0.97, train_acc=0.999, train_loss=0.0685, train_precision=0.969, train_recall=0.971] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       0.98      0.98      0.98        55
         ORG       0.98      0.99      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      1.00       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.99      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.682, eval_acc=0.948, eval_loss=11.1, eval_precision=0.636, eval_recall=0.746]


eval_reports:
              precision    recall  f1-score   support

         GPE       0.67      0.77      0.72      3160
         LOC       0.30      0.37      0.33       482
         ORG       0.49      0.63      0.55      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.63      0.74      0.68      6937
   macro avg       0.57      0.66      0.61      6937
weighted avg       0.64      0.74      0.69      6937



calculate data/few_shot/note4/train_1000.json etag: 100%|██████████| 385k/385k [00:00<00:00, 276MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 334MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 374MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 202kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_1000.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_1000_x3"
}
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 179891.14L/s]
build line mapper: 19L [00:00, 35230.67L/s]9 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5501.30it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 203497.23it/s]
load dataset from data/few_shot/note4/train_1000.json: 0it [00:00, ?it/s]

load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/f1dd66c8309dd10fb1912b81c20e7797_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_1000.json: 1000it [00:01, 837.52it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 572.30it/s]


Load pretrained embedding from file.........


Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of LEBertModel were not initialized from the model checkpoint at save_pretrained/note4_pretrain_l

train_reports:
              precision    recall  f1-score   support

         GPE       0.00      0.01      0.00       326
         LOC       0.00      0.00      0.00        55
         ORG       0.00      0.00      0.00       190
         PER       0.00      0.00      0.00       267

   micro avg       0.00      0.00      0.00       838
   macro avg       0.00      0.00      0.00       838
weighted avg       0.00      0.00      0.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.03it/s, F1=0.00944, eval_acc=0.908, eval_loss=16.5, eval_precision=0.01, eval_recall=0.00923]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.01      0.02      0.01      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.03      0.02      0.02      1650

   micro avg       0.01      0.01      0.01      6937
   macro avg       0.01      0.01      0.01      6937
weighted avg       0.01      0.01      0.01      6937



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.57it/s, F1=0.308, train_acc=0.95, train_loss=5.75, train_precision=0.276, train_recall=0.372]      


train_reports:
              precision    recall  f1-score   support

         GPE       0.25      0.44      0.32       326
         LOC       0.00      0.00      0.00        55
         ORG       0.03      0.06      0.04       190
         PER       0.67      0.65      0.66       267

   micro avg       0.27      0.39      0.32       838
   macro avg       0.24      0.29      0.25       838
weighted avg       0.32      0.39      0.34       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.03it/s, F1=0.541, eval_acc=0.951, eval_loss=8.13, eval_precision=0.519, eval_recall=0.577]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.59      0.81      0.68      3160
         LOC       0.01      0.00      0.01       482
         ORG       0.01      0.01      0.01      1645
         PER       0.89      0.86      0.88      1650

   micro avg       0.51      0.58      0.54      6937
   macro avg       0.38      0.42      0.39      6937
weighted avg       0.49      0.58      0.52      6937



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.60it/s, F1=0.626, train_acc=0.972, train_loss=2.94, train_precision=0.61, train_recall=0.677] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.67      0.78      0.72       326
         LOC       0.16      0.11      0.13        55
         ORG       0.23      0.38      0.29       190
         PER       0.86      0.88      0.87       267

   micro avg       0.56      0.68      0.61       838
   macro avg       0.48      0.54      0.50       838
weighted avg       0.60      0.68      0.63       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.58, eval_acc=0.957, eval_loss=6.33, eval_precision=0.543, eval_recall=0.632] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.73      0.71      3160
         LOC       0.13      0.19      0.15       482
         ORG       0.20      0.29      0.24      1645
         PER       0.89      0.91      0.90      1650

   micro avg       0.54      0.63      0.58      6937
   macro avg       0.48      0.53      0.50      6937
weighted avg       0.58      0.63      0.61      6937



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.32it/s, F1=0.756, train_acc=0.984, train_loss=1.72, train_precision=0.72, train_recall=0.811] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.83      0.89      0.86       326
         LOC       0.30      0.44      0.36        55
         ORG       0.61      0.76      0.68       190
         PER       0.89      0.94      0.91       267

   micro avg       0.75      0.85      0.79       838
   macro avg       0.66      0.76      0.70       838
weighted avg       0.76      0.85      0.80       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.65, eval_acc=0.958, eval_loss=7.19, eval_precision=0.617, eval_recall=0.697] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.83      0.73      3160
         LOC       0.14      0.13      0.13       482
         ORG       0.37      0.42      0.39      1645
         PER       0.88      0.91      0.90      1650

   micro avg       0.61      0.70      0.65      6937
   macro avg       0.51      0.57      0.54      6937
weighted avg       0.61      0.70      0.65      6937



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.825, train_acc=0.991, train_loss=0.986, train_precision=0.812, train_recall=0.849]


train_reports:
              precision    recall  f1-score   support

         GPE       0.89      0.93      0.91       326
         LOC       0.44      0.55      0.49        55
         ORG       0.75      0.87      0.81       190
         PER       0.95      0.96      0.96       267

   micro avg       0.84      0.90      0.87       838
   macro avg       0.76      0.83      0.79       838
weighted avg       0.85      0.90      0.87       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.654, eval_acc=0.96, eval_loss=6.85, eval_precision=0.599, eval_recall=0.731] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.77      0.73      3160
         LOC       0.19      0.32      0.24       482
         ORG       0.43      0.56      0.48      1645
         PER       0.79      0.94      0.86      1650

   micro avg       0.60      0.73      0.66      6937
   macro avg       0.52      0.65      0.58      6937
weighted avg       0.62      0.73      0.67      6937



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.882, train_acc=0.994, train_loss=0.638, train_precision=0.862, train_recall=0.909]


train_reports:
              precision    recall  f1-score   support

         GPE       0.93      0.95      0.94       326
         LOC       0.77      0.87      0.82        55
         ORG       0.85      0.93      0.89       190
         PER       0.93      0.96      0.95       267

   micro avg       0.90      0.95      0.92       838
   macro avg       0.87      0.93      0.90       838
weighted avg       0.90      0.95      0.92       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.49it/s, F1=0.604, eval_acc=0.924, eval_loss=12.1, eval_precision=0.506, eval_recall=0.762]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.64      0.79      0.71      3160
         LOC       0.21      0.35      0.26       482
         ORG       0.27      0.62      0.38      1645
         PER       0.81      0.93      0.87      1650

   micro avg       0.51      0.75      0.60      6937
   macro avg       0.48      0.67      0.55      6937
weighted avg       0.56      0.75      0.64      6937



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.65it/s, F1=0.94, train_acc=0.996, train_loss=0.504, train_precision=0.929, train_recall=0.956] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       326
         LOC       0.89      0.93      0.91        55
         ORG       0.85      0.93      0.89       190
         PER       0.96      0.99      0.98       267

   micro avg       0.94      0.97      0.95       838
   macro avg       0.92      0.96      0.94       838
weighted avg       0.94      0.97      0.95       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.675, eval_acc=0.959, eval_loss=8.51, eval_precision=0.621, eval_recall=0.753]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.81      0.74      3160
         LOC       0.23      0.46      0.31       482
         ORG       0.48      0.56      0.52      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.62      0.75      0.68      6937
   macro avg       0.56      0.69      0.61      6937
weighted avg       0.64      0.75      0.69      6937



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.91, train_acc=0.997, train_loss=0.36, train_precision=0.902, train_recall=0.922]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       326
         LOC       0.88      0.91      0.89        55
         ORG       0.88      0.92      0.90       190
         PER       0.99      1.00      0.99       267

   micro avg       0.95      0.97      0.96       838
   macro avg       0.93      0.95      0.94       838
weighted avg       0.95      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.682, eval_acc=0.96, eval_loss=7.84, eval_precision=0.63, eval_recall=0.756]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.79      0.75      3160
         LOC       0.26      0.44      0.32       482
         ORG       0.46      0.60      0.52      1645
         PER       0.84      0.93      0.88      1650

   micro avg       0.63      0.75      0.69      6937
   macro avg       0.57      0.69      0.62      6937
weighted avg       0.65      0.75      0.70      6937



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.36it/s, F1=0.934, train_acc=0.997, train_loss=0.266, train_precision=0.928, train_recall=0.943]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       326
         LOC       0.93      0.93      0.93        55
         ORG       0.90      0.95      0.92       190
         PER       0.99      0.99      0.99       267

   micro avg       0.95      0.97      0.96       838
   macro avg       0.94      0.96      0.95       838
weighted avg       0.95      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.683, eval_acc=0.959, eval_loss=8.98, eval_precision=0.637, eval_recall=0.747]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.78      0.72      3160
         LOC       0.29      0.25      0.27       482
         ORG       0.49      0.65      0.56      1645
         PER       0.83      0.91      0.87      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.57      0.65      0.60      6937
weighted avg       0.64      0.74      0.68      6937



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.977, train_acc=0.999, train_loss=0.143, train_precision=0.972, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       326
         LOC       0.84      0.87      0.86        55
         ORG       0.96      0.99      0.98       190
         PER       0.99      1.00      0.99       267

   micro avg       0.97      0.99      0.98       838
   macro avg       0.95      0.97      0.96       838
weighted avg       0.97      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.669, eval_acc=0.959, eval_loss=9.31, eval_precision=0.646, eval_recall=0.703]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.64      0.70      3160
         LOC       0.20      0.43      0.28       482
         ORG       0.53      0.66      0.59      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.64      0.70      0.67      6937
   macro avg       0.58      0.66      0.61      6937
weighted avg       0.68      0.70      0.68      6937



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.69it/s, F1=0.962, train_acc=0.999, train_loss=0.178, train_precision=0.962, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       326
         LOC       0.93      0.93      0.93        55
         ORG       0.99      0.99      0.99       190
         PER       0.99      0.99      0.99       267

   micro avg       0.98      0.98      0.98       838
   macro avg       0.97      0.97      0.97       838
weighted avg       0.98      0.98      0.98       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.45it/s, F1=0.687, eval_acc=0.96, eval_loss=8.45, eval_precision=0.646, eval_recall=0.746] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.75      0.74      3160
         LOC       0.21      0.50      0.30       482
         ORG       0.56      0.61      0.58      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.64      0.74      0.69      6937
   macro avg       0.58      0.70      0.62      6937
weighted avg       0.68      0.74      0.70      6937



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.959, train_acc=0.999, train_loss=0.101, train_precision=0.954, train_recall=0.966] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       326
         LOC       0.93      0.96      0.95        55
         ORG       0.95      0.98      0.96       190
         PER       1.00      0.99      0.99       267

   micro avg       0.97      0.98      0.98       838
   macro avg       0.96      0.98      0.97       838
weighted avg       0.97      0.98      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.701, eval_acc=0.963, eval_loss=9.87, eval_precision=0.708, eval_recall=0.704]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.71      0.73      3160
         LOC       0.31      0.38      0.34       482
         ORG       0.61      0.61      0.61      1645
         PER       0.86      0.92      0.89      1650

   micro avg       0.71      0.71      0.71      6937
   macro avg       0.63      0.65      0.64      6937
weighted avg       0.71      0.71      0.71      6937



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.967, train_acc=0.998, train_loss=0.205, train_precision=0.962, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       326
         LOC       0.86      0.89      0.88        55
         ORG       0.96      0.97      0.97       190
         PER       0.98      0.99      0.99       267

   micro avg       0.96      0.98      0.97       838
   macro avg       0.94      0.96      0.95       838
weighted avg       0.96      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.696, eval_acc=0.96, eval_loss=8.97, eval_precision=0.651, eval_recall=0.759] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.79      0.75      3160
         LOC       0.25      0.42      0.31       482
         ORG       0.52      0.64      0.58      1645
         PER       0.84      0.91      0.88      1650

   micro avg       0.65      0.76      0.70      6937
   macro avg       0.58      0.69      0.63      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.33it/s, F1=0.946, train_acc=0.999, train_loss=0.123, train_precision=0.943, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       0.83      0.91      0.87        55
         ORG       0.97      0.99      0.98       190
         PER       1.00      0.99      0.99       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.95      0.97      0.96       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.71, eval_acc=0.963, eval_loss=8.84, eval_precision=0.673, eval_recall=0.762] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.81      0.77      3160
         LOC       0.27      0.40      0.32       482
         ORG       0.55      0.61      0.58      1645
         PER       0.84      0.93      0.88      1650

   micro avg       0.68      0.77      0.72      6937
   macro avg       0.60      0.69      0.64      6937
weighted avg       0.69      0.77      0.72      6937



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.65it/s, F1=0.975, train_acc=0.999, train_loss=0.15, train_precision=0.972, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      0.99      0.99       190
         PER       0.96      0.98      0.97       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.98      0.99      0.99       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.708, eval_acc=0.963, eval_loss=8.91, eval_precision=0.671, eval_recall=0.759]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.82      0.75      3160
         LOC       0.30      0.38      0.34       482
         ORG       0.54      0.59      0.57      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.60      0.67      0.64      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.30it/s, F1=0.941, train_acc=0.999, train_loss=0.139, train_precision=0.937, train_recall=0.948]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       326
         LOC       0.95      0.98      0.96        55
         ORG       0.97      0.99      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.97      0.99      0.98       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.712, eval_acc=0.963, eval_loss=9.07, eval_precision=0.674, eval_recall=0.764]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.83      0.76      3160
         LOC       0.38      0.30      0.34       482
         ORG       0.51      0.64      0.57      1645
         PER       0.88      0.91      0.89      1650

   micro avg       0.67      0.77      0.72      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.67      0.77      0.72      6937



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.69it/s, F1=0.976, train_acc=0.999, train_loss=0.109, train_precision=0.971, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       326
         LOC       0.98      1.00      0.99        55
         ORG       0.97      0.99      0.98       190
         PER       0.99      0.99      0.99       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.98      0.99      0.99       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.715, eval_acc=0.962, eval_loss=9.89, eval_precision=0.69, eval_recall=0.75]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.77      0.76      3160
         LOC       0.33      0.40      0.36       482
         ORG       0.57      0.65      0.61      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.69      0.75      0.72      6937
   macro avg       0.62      0.69      0.65      6937
weighted avg       0.70      0.75      0.72      6937



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.72it/s, F1=0.94, train_acc=0.999, train_loss=0.15, train_precision=0.939, train_recall=0.944]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       326
         LOC       0.89      0.93      0.91        55
         ORG       0.99      0.99      0.99       190
         PER       0.99      0.99      0.99       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.96      0.98      0.97       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.691, eval_acc=0.961, eval_loss=10.4, eval_precision=0.68, eval_recall=0.712] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.71      0.72      3160
         LOC       0.25      0.38      0.30       482
         ORG       0.59      0.62      0.61      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.68      0.71      0.70      6937
   macro avg       0.61      0.65      0.63      6937
weighted avg       0.70      0.71      0.70      6937



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.32it/s, F1=0.957, train_acc=0.998, train_loss=0.334, train_precision=0.953, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

         GPE       0.93      0.97      0.95       326
         LOC       1.00      1.00      1.00        55
         ORG       0.94      0.97      0.96       190
         PER       0.98      0.98      0.98       267

   micro avg       0.95      0.97      0.96       838
   macro avg       0.96      0.98      0.97       838
weighted avg       0.95      0.97      0.96       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.671, eval_acc=0.958, eval_loss=10.1, eval_precision=0.639, eval_recall=0.716]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.76      0.72      3160
         LOC       0.30      0.37      0.33       482
         ORG       0.51      0.51      0.51      1645
         PER       0.75      0.92      0.83      1650

   micro avg       0.64      0.72      0.67      6937
   macro avg       0.56      0.64      0.60      6937
weighted avg       0.63      0.72      0.67      6937



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.949, train_acc=0.999, train_loss=0.0987, train_precision=0.947, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       326
         LOC       0.96      1.00      0.98        55
         ORG       0.98      0.99      0.99       190
         PER       0.98      0.99      0.98       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.98      0.99      0.98       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.683, eval_acc=0.957, eval_loss=10.4, eval_precision=0.631, eval_recall=0.764]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.78      0.75      3160
         LOC       0.37      0.26      0.30       482
         ORG       0.44      0.68      0.53      1645
         PER       0.79      0.94      0.86      1650

   micro avg       0.63      0.76      0.69      6937
   macro avg       0.58      0.66      0.61      6937
weighted avg       0.64      0.76      0.69      6937



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.988, train_acc=1, train_loss=0.0395, train_precision=0.986, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.98      0.99      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      1.00       838
   macro avg       0.99      1.00      1.00       838
weighted avg       0.99      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.42it/s, F1=0.698, eval_acc=0.96, eval_loss=12.6, eval_precision=0.721, eval_recall=0.687] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.71      0.73      3160
         LOC       0.37      0.32      0.34       482
         ORG       0.59      0.55      0.56      1645
         PER       0.90      0.89      0.90      1650

   micro avg       0.72      0.69      0.70      6937
   macro avg       0.65      0.62      0.63      6937
weighted avg       0.72      0.69      0.70      6937



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.972, train_acc=1, train_loss=0.0331, train_precision=0.971, train_recall=0.974]   


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       1.00      1.00      1.00        55
         ORG       0.98      0.99      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      1.00       838
   macro avg       0.99      1.00      1.00       838
weighted avg       0.99      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.704, eval_acc=0.961, eval_loss=11.5, eval_precision=0.692, eval_recall=0.725]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.79      0.75      3160
         LOC       0.35      0.35      0.35       482
         ORG       0.55      0.54      0.54      1645
         PER       0.88      0.90      0.89      1650

   micro avg       0.69      0.73      0.71      6937
   macro avg       0.62      0.64      0.63      6937
weighted avg       0.69      0.73      0.71      6937



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.61it/s, F1=0.955, train_acc=0.999, train_loss=0.114, train_precision=0.953, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       326
         LOC       1.00      1.00      1.00        55
         ORG       0.97      0.98      0.97       190
         PER       0.99      1.00      0.99       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:17<00:00,  4.00it/s, F1=0.704, eval_acc=0.961, eval_loss=10.9, eval_precision=0.678, eval_recall=0.744]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.83      0.77      3160
         LOC       0.36      0.36      0.36       482
         ORG       0.53      0.58      0.55      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.68      0.75      0.71      6937
   macro avg       0.61      0.66      0.64      6937
weighted avg       0.68      0.75      0.71      6937



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.34it/s, F1=0.976, train_acc=1, train_loss=0.0539, train_precision=0.974, train_recall=0.978]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       1.00      1.00      1.00        55
         ORG       0.97      0.99      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      0.99       838
   macro avg       0.99      1.00      0.99       838
weighted avg       0.99      1.00      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.701, eval_acc=0.958, eval_loss=12.3, eval_precision=0.678, eval_recall=0.734]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.78      0.74      3160
         LOC       0.29      0.43      0.35       482
         ORG       0.57      0.54      0.56      1645
         PER       0.88      0.91      0.89      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.61      0.67      0.63      6937
weighted avg       0.68      0.73      0.71      6937



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.64it/s, F1=0.977, train_acc=0.999, train_loss=0.182, train_precision=0.975, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       326
         LOC       0.98      0.98      0.98        55
         ORG       0.97      0.97      0.97       190
         PER       1.00      1.00      1.00       267

   micro avg       0.98      0.99      0.98       838
   macro avg       0.98      0.98      0.98       838
weighted avg       0.98      0.99      0.98       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.699, eval_acc=0.959, eval_loss=11.8, eval_precision=0.676, eval_recall=0.733]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.77      0.73      3160
         LOC       0.27      0.42      0.33       482
         ORG       0.59      0.60      0.60      1645
         PER       0.90      0.89      0.89      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.69      0.73      0.71      6937



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:37<00:00,  3.34it/s, F1=0.971, train_acc=0.999, train_loss=0.114, train_precision=0.972, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       326
         LOC       1.00      0.98      0.99        55
         ORG       0.97      0.98      0.98       190
         PER       1.00      1.00      1.00       267

   micro avg       0.98      0.99      0.99       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.98      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.18it/s, F1=0.673, eval_acc=0.954, eval_loss=11.9, eval_precision=0.612, eval_recall=0.763]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.80      0.73      3160
         LOC       0.18      0.48      0.26       482
         ORG       0.55      0.63      0.59      1645
         PER       0.88      0.91      0.89      1650

   micro avg       0.61      0.76      0.68      6937
   macro avg       0.57      0.71      0.62      6937
weighted avg       0.65      0.76      0.70      6937



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.68it/s, F1=0.96, train_acc=1, train_loss=0.02, train_precision=0.959, train_recall=0.96]    


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       326
         LOC       0.98      1.00      0.99        55
         ORG       1.00      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       1.00      1.00      1.00       838
   macro avg       1.00      1.00      1.00       838
weighted avg       1.00      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.71, eval_acc=0.961, eval_loss=11.5, eval_precision=0.698, eval_recall=0.732] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.76      0.74      3160
         LOC       0.32      0.37      0.34       482
         ORG       0.59      0.62      0.60      1645
         PER       0.88      0.90      0.89      1650

   micro avg       0.69      0.74      0.71      6937
   macro avg       0.63      0.66      0.64      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.67it/s, F1=0.98, train_acc=1, train_loss=0.031, train_precision=0.978, train_recall=0.983]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       326
         LOC       0.96      0.98      0.97        55
         ORG       0.99      1.00      1.00       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      1.00      1.00       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.99      1.00      1.00       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.713, eval_acc=0.962, eval_loss=11.8, eval_precision=0.716, eval_recall=0.72] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.76      0.73      3160
         LOC       0.43      0.31      0.36       482
         ORG       0.61      0.58      0.59      1645
         PER       0.88      0.90      0.89      1650

   micro avg       0.71      0.72      0.71      6937
   macro avg       0.65      0.64      0.64      6937
weighted avg       0.70      0.72      0.71      6937



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.38it/s, F1=0.963, train_acc=1, train_loss=0.0589, train_precision=0.963, train_recall=0.963]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       326
         LOC       1.00      1.00      1.00        55
         ORG       0.99      0.98      0.99       190
         PER       1.00      1.00      1.00       267

   micro avg       0.99      0.99      0.99       838
   macro avg       0.99      0.99      0.99       838
weighted avg       0.99      0.99      0.99       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.71, eval_acc=0.959, eval_loss=11.3, eval_precision=0.671, eval_recall=0.765] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.80      0.76      3160
         LOC       0.41      0.38      0.39       482
         ORG       0.49      0.65      0.56      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.62      0.69      0.65      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:34<00:00,  3.66it/s, F1=0.952, train_acc=0.997, train_loss=0.337, train_precision=0.949, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       326
         LOC       0.91      0.93      0.92        55
         ORG       0.98      0.99      0.99       190
         PER       0.95      0.98      0.97       267

   micro avg       0.97      0.98      0.97       838
   macro avg       0.96      0.97      0.96       838
weighted avg       0.97      0.98      0.97       838



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.716, eval_acc=0.962, eval_loss=10.5, eval_precision=0.7, eval_recall=0.743]  


eval_reports:
              precision    recall  f1-score   support

         GPE       0.71      0.81      0.76      3160
         LOC       0.38      0.34      0.36       482
         ORG       0.56      0.59      0.57      1645
         PER       0.89      0.90      0.90      1650

   micro avg       0.70      0.75      0.72      6937
   macro avg       0.64      0.66      0.65      6937
weighted avg       0.70      0.75      0.72      6937



calculate data/few_shot/note4/train_1350.json etag: 100%|██████████| 518k/518k [00:00<00:00, 22.4MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 337MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 374MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 576kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_1350.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_1350_x1"
}
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 144894.14L/s]
build line mapper: 19L [00:00, 164652.43L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5550.34it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 156959.40it/s]

load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding



load dataset from data/few_shot/note4/train_1350.json: 1350it [00:01, 840.35it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 572.77it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mo

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.111, train_acc=0.857, train_loss=16.4, train_precision=0.115, train_recall=0.118]      


train_reports:
              precision    recall  f1-score   support

         GPE       0.07      0.15      0.09       424
         LOC       0.00      0.00      0.00        76
         ORG       0.01      0.04      0.01       256
         PER       0.07      0.14      0.09       362
           _       0.00      0.00      0.00         0

   micro avg       0.04      0.11      0.06      1118
   macro avg       0.03      0.07      0.04      1118
weighted avg       0.05      0.11      0.07      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.498, eval_acc=0.947, eval_loss=7.48, eval_precision=0.472, eval_recall=0.536]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.48      0.65      0.55      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.10      0.10      0.10      1645
         PER       0.80      0.85      0.83      1650

   micro avg       0.46      0.52      0.49      6937
   macro avg       0.35      0.40      0.37      6937
weighted avg       0.43      0.52      0.47      6937



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.6, train_acc=0.969, train_loss=3.07, train_precision=0.592, train_recall=0.65]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.58      0.73      0.65       424
         LOC       0.05      0.05      0.05        76
         ORG       0.45      0.54      0.49       256
         PER       0.77      0.82      0.79       362

   micro avg       0.58      0.67      0.62      1118
   macro avg       0.46      0.54      0.50      1118
weighted avg       0.58      0.67      0.62      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.604, eval_acc=0.954, eval_loss=5.85, eval_precision=0.617, eval_recall=0.604]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.58      0.70      0.63      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.47      0.38      0.42      1645
         PER       0.89      0.80      0.84      1650

   micro avg       0.61      0.60      0.60      6937
   macro avg       0.49      0.47      0.48      6937
weighted avg       0.59      0.60      0.59      6937



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.785, train_acc=0.984, train_loss=1.51, train_precision=0.777, train_recall=0.818]


train_reports:
              precision    recall  f1-score   support

         GPE       0.83      0.86      0.85       424
         LOC       0.56      0.55      0.56        76
         ORG       0.71      0.82      0.76       256
         PER       0.88      0.91      0.89       362

   micro avg       0.80      0.85      0.82      1118
   macro avg       0.74      0.79      0.76      1118
weighted avg       0.80      0.85      0.82      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.701, eval_acc=0.961, eval_loss=6.48, eval_precision=0.721, eval_recall=0.691]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.75      0.76      3160
         LOC       0.36      0.27      0.31       482
         ORG       0.56      0.48      0.52      1645
         PER       0.84      0.92      0.88      1650

   micro avg       0.72      0.69      0.71      6937
   macro avg       0.63      0.60      0.62      6937
weighted avg       0.71      0.69      0.70      6937



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.66it/s, F1=0.867, train_acc=0.989, train_loss=1.02, train_precision=0.856, train_recall=0.899] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.88      0.92      0.90       424
         LOC       0.74      0.75      0.75        76
         ORG       0.82      0.89      0.85       256
         PER       0.87      0.95      0.91       362

   micro avg       0.85      0.91      0.88      1118
   macro avg       0.83      0.88      0.85      1118
weighted avg       0.85      0.91      0.88      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.704, eval_acc=0.961, eval_loss=5.5, eval_precision=0.68, eval_recall=0.739]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.79      0.75      3160
         LOC       0.29      0.38      0.33       482
         ORG       0.54      0.58      0.56      1645
         PER       0.85      0.92      0.89      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.60      0.67      0.63      6937
weighted avg       0.68      0.74      0.71      6937



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.895, train_acc=0.994, train_loss=0.678, train_precision=0.887, train_recall=0.912]


train_reports:
              precision    recall  f1-score   support

         GPE       0.90      0.92      0.91       424
         LOC       0.79      0.83      0.81        76
         ORG       0.87      0.93      0.90       256
         PER       0.95      0.98      0.96       362

   micro avg       0.90      0.94      0.92      1118
   macro avg       0.88      0.92      0.90      1118
weighted avg       0.90      0.94      0.92      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.52it/s, F1=0.711, eval_acc=0.961, eval_loss=6.75, eval_precision=0.697, eval_recall=0.733]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.77      0.75      3160
         LOC       0.28      0.46      0.35       482
         ORG       0.61      0.56      0.59      1645
         PER       0.88      0.90      0.89      1650

   micro avg       0.69      0.73      0.71      6937
   macro avg       0.63      0.67      0.64      6937
weighted avg       0.71      0.73      0.72      6937



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.909, train_acc=0.996, train_loss=0.433, train_precision=0.905, train_recall=0.919]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.96      0.97       424
         LOC       0.84      0.88      0.86        76
         ORG       0.89      0.94      0.91       256
         PER       0.96      0.98      0.97       362

   micro avg       0.94      0.96      0.95      1118
   macro avg       0.92      0.94      0.93      1118
weighted avg       0.94      0.96      0.95      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.718, eval_acc=0.963, eval_loss=6.76, eval_precision=0.696, eval_recall=0.749]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.84      0.75      3160
         LOC       0.38      0.26      0.31       482
         ORG       0.60      0.57      0.58      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.70      0.75      0.72      6937
   macro avg       0.64      0.64      0.64      6937
weighted avg       0.69      0.75      0.72      6937



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.95, train_acc=0.997, train_loss=0.292, train_precision=0.945, train_recall=0.957] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.97      0.97       424
         LOC       0.91      0.89      0.90        76
         ORG       0.94      0.97      0.96       256
         PER       0.98      0.99      0.99       362

   micro avg       0.96      0.97      0.97      1118
   macro avg       0.95      0.96      0.95      1118
weighted avg       0.96      0.97      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.48it/s, F1=0.705, eval_acc=0.958, eval_loss=7.17, eval_precision=0.66, eval_recall=0.765] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.75      0.75      3160
         LOC       0.21      0.44      0.28       482
         ORG       0.55      0.71      0.62      1645
         PER       0.87      0.92      0.89      1650

   micro avg       0.66      0.76      0.70      6937
   macro avg       0.60      0.71      0.64      6937
weighted avg       0.70      0.76      0.72      6937



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.948, train_acc=0.997, train_loss=0.281, train_precision=0.939, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       424
         LOC       0.84      0.91      0.87        76
         ORG       0.92      0.96      0.94       256
         PER       0.98      0.99      0.99       362

   micro avg       0.95      0.98      0.97      1118
   macro avg       0.93      0.96      0.94      1118
weighted avg       0.96      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.725, eval_acc=0.963, eval_loss=7.43, eval_precision=0.705, eval_recall=0.755]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.82      0.79      3160
         LOC       0.40      0.32      0.36       482
         ORG       0.57      0.65      0.60      1645
         PER       0.84      0.88      0.86      1650

   micro avg       0.71      0.76      0.73      6937
   macro avg       0.64      0.67      0.65      6937
weighted avg       0.71      0.76      0.73      6937



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.958, train_acc=0.998, train_loss=0.272, train_precision=0.956, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       424
         LOC       0.91      0.91      0.91        76
         ORG       0.96      0.97      0.97       256
         PER       0.99      0.99      0.99       362

   micro avg       0.98      0.98      0.98      1118
   macro avg       0.96      0.97      0.96      1118
weighted avg       0.98      0.98      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.713, eval_acc=0.957, eval_loss=7.2, eval_precision=0.671, eval_recall=0.775] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.78      0.76      0.77      3160
         LOC       0.26      0.38      0.31       482
         ORG       0.52      0.76      0.62      1645
         PER       0.85      0.91      0.88      1650

   micro avg       0.67      0.77      0.72      6937
   macro avg       0.60      0.70      0.64      6937
weighted avg       0.70      0.77      0.73      6937



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.939, train_acc=0.999, train_loss=0.148, train_precision=0.938, train_recall=0.941]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.98      0.98       424
         LOC       0.94      0.97      0.95        76
         ORG       0.98      0.99      0.98       256
         PER       0.99      0.99      0.99       362

   micro avg       0.98      0.98      0.98      1118
   macro avg       0.97      0.98      0.98      1118
weighted avg       0.98      0.98      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.73, eval_acc=0.963, eval_loss=7.64, eval_precision=0.694, eval_recall=0.781] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.84      0.77      3160
         LOC       0.30      0.41      0.35       482
         ORG       0.64      0.64      0.64      1645
         PER       0.84      0.91      0.87      1650

   micro avg       0.69      0.78      0.73      6937
   macro avg       0.62      0.70      0.66      6937
weighted avg       0.70      0.78      0.74      6937



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.954, train_acc=0.999, train_loss=0.0825, train_precision=0.953, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.97      0.95      0.96        76
         ORG       1.00      1.00      1.00       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.98      0.98      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.44it/s, F1=0.718, eval_acc=0.961, eval_loss=8, eval_precision=0.686, eval_recall=0.763]   


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.74      0.76      3160
         LOC       0.24      0.53      0.33       482
         ORG       0.62      0.70      0.66      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.68      0.76      0.72      6937
   macro avg       0.62      0.72      0.66      6937
weighted avg       0.72      0.76      0.73      6937



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.936, train_acc=0.997, train_loss=0.271, train_precision=0.931, train_recall=0.944]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.92      0.95      0.94        76
         ORG       0.91      0.95      0.93       256
         PER       0.99      1.00      1.00       362

   micro avg       0.96      0.98      0.97      1118
   macro avg       0.95      0.97      0.96      1118
weighted avg       0.97      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.713, eval_acc=0.96, eval_loss=7.43, eval_precision=0.659, eval_recall=0.786] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.83      0.75      3160
         LOC       0.30      0.33      0.31       482
         ORG       0.54      0.68      0.60      1645
         PER       0.88      0.91      0.89      1650

   micro avg       0.66      0.78      0.72      6937
   macro avg       0.60      0.69      0.64      6937
weighted avg       0.67      0.78      0.72      6937



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.95, train_acc=0.999, train_loss=0.132, train_precision=0.949, train_recall=0.952] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       424
         LOC       0.95      0.97      0.96        76
         ORG       0.99      0.97      0.98       256
         PER       0.99      1.00      1.00       362

   micro avg       0.98      0.99      0.98      1118
   macro avg       0.98      0.98      0.98      1118
weighted avg       0.98      0.99      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.41it/s, F1=0.733, eval_acc=0.963, eval_loss=7.45, eval_precision=0.709, eval_recall=0.769]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.81      0.78      3160
         LOC       0.39      0.38      0.38       482
         ORG       0.57      0.70      0.63      1645
         PER       0.90      0.89      0.89      1650

   micro avg       0.71      0.77      0.74      6937
   macro avg       0.65      0.69      0.67      6937
weighted avg       0.72      0.77      0.74      6937



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.958, train_acc=0.999, train_loss=0.0813, train_precision=0.958, train_recall=0.959]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       1.00      1.00      1.00        76
         ORG       0.97      0.98      0.98       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.725, eval_acc=0.964, eval_loss=7.9, eval_precision=0.714, eval_recall=0.745] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.78      0.76      0.77      3160
         LOC       0.32      0.48      0.39       482
         ORG       0.63      0.64      0.63      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.71      0.75      0.73      6937
   macro avg       0.64      0.70      0.66      6937
weighted avg       0.73      0.75      0.74      6937



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.952, train_acc=0.999, train_loss=0.152, train_precision=0.95, train_recall=0.955] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       424
         LOC       0.99      0.99      0.99        76
         ORG       0.99      1.00      0.99       256
         PER       0.97      0.98      0.98       362

   micro avg       0.98      0.99      0.98      1118
   macro avg       0.98      0.99      0.99      1118
weighted avg       0.98      0.99      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.44it/s, F1=0.728, eval_acc=0.962, eval_loss=8.06, eval_precision=0.709, eval_recall=0.756]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.78      0.77      3160
         LOC       0.30      0.44      0.36       482
         ORG       0.63      0.65      0.64      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.71      0.75      0.73      6937
   macro avg       0.63      0.69      0.66      6937
weighted avg       0.72      0.75      0.73      6937



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.63it/s, F1=0.949, train_acc=0.998, train_loss=0.31, train_precision=0.944, train_recall=0.956] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.95      0.96      0.96       424
         LOC       0.88      0.92      0.90        76
         ORG       0.97      0.99      0.98       256
         PER       0.96      0.98      0.97       362

   micro avg       0.95      0.97      0.96      1118
   macro avg       0.94      0.96      0.95      1118
weighted avg       0.95      0.97      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.735, eval_acc=0.963, eval_loss=8.1, eval_precision=0.752, eval_recall=0.728] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.79      0.78      3160
         LOC       0.41      0.34      0.37       482
         ORG       0.65      0.58      0.61      1645
         PER       0.89      0.89      0.89      1650

   micro avg       0.75      0.73      0.74      6937
   macro avg       0.68      0.65      0.66      6937
weighted avg       0.74      0.73      0.74      6937



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.972, train_acc=0.999, train_loss=0.179, train_precision=0.968, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       424
         LOC       0.97      0.97      0.97        76
         ORG       0.99      1.00      1.00       256
         PER       0.99      0.99      0.99       362

   micro avg       0.98      0.99      0.98      1118
   macro avg       0.98      0.99      0.98      1118
weighted avg       0.98      0.99      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.34it/s, F1=0.734, eval_acc=0.963, eval_loss=7.84, eval_precision=0.73, eval_recall=0.745] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.79      0.77      3160
         LOC       0.32      0.36      0.34       482
         ORG       0.63      0.67      0.65      1645
         PER       0.90      0.85      0.87      1650

   micro avg       0.73      0.74      0.73      6937
   macro avg       0.65      0.67      0.66      6937
weighted avg       0.73      0.74      0.74      6937



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.969, train_acc=0.999, train_loss=0.207, train_precision=0.971, train_recall=0.971] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.96      0.89      0.93        76
         ORG       0.99      0.99      0.99       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      0.98      0.99      1118
   macro avg       0.98      0.97      0.97      1118
weighted avg       0.99      0.98      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.688, eval_acc=0.958, eval_loss=7.77, eval_precision=0.644, eval_recall=0.749]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.83      0.73      3160
         LOC       0.22      0.33      0.27       482
         ORG       0.59      0.57      0.58      1645
         PER       0.83      0.90      0.86      1650

   micro avg       0.64      0.75      0.69      6937
   macro avg       0.57      0.66      0.61      6937
weighted avg       0.65      0.75      0.69      6937



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.97, train_acc=0.999, train_loss=0.126, train_precision=0.972, train_recall=0.971] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.92      0.93      0.93        76
         ORG       0.98      0.99      0.99       256
         PER       1.00      0.99      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.97      0.98      0.98      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.36it/s, F1=0.69, eval_acc=0.956, eval_loss=9.17, eval_precision=0.713, eval_recall=0.676] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.78      0.76      3160
         LOC       0.36      0.33      0.34       482
         ORG       0.53      0.38      0.44      1645
         PER       0.85      0.89      0.87      1650

   micro avg       0.71      0.68      0.69      6937
   macro avg       0.62      0.59      0.61      6937
weighted avg       0.70      0.68      0.68      6937



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.978, train_acc=0.999, train_loss=0.122, train_precision=0.977, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.97      0.99      0.98        76
         ORG       0.98      0.98      0.98       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.696, eval_acc=0.958, eval_loss=10.3, eval_precision=0.678, eval_recall=0.721]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.87      0.75      3160
         LOC       0.39      0.25      0.30       482
         ORG       0.60      0.42      0.49      1645
         PER       0.83      0.89      0.86      1650

   micro avg       0.68      0.72      0.70      6937
   macro avg       0.62      0.61      0.60      6937
weighted avg       0.67      0.72      0.68      6937



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.66it/s, F1=0.968, train_acc=1, train_loss=0.0865, train_precision=0.967, train_recall=0.97]     


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       1.00      0.99      0.99        76
         ORG       0.98      0.99      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.39it/s, F1=0.711, eval_acc=0.961, eval_loss=8.55, eval_precision=0.683, eval_recall=0.75] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.75      0.75      3160
         LOC       0.26      0.50      0.34       482
         ORG       0.62      0.68      0.65      1645
         PER       0.85      0.90      0.88      1650

   micro avg       0.69      0.75      0.72      6937
   macro avg       0.62      0.71      0.66      6937
weighted avg       0.71      0.75      0.73      6937



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.968, train_acc=0.999, train_loss=0.0876, train_precision=0.97, train_recall=0.969] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       1.00      1.00      1.00        76
         ORG       0.99      0.99      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       1.00      1.00      1.00      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.715, eval_acc=0.962, eval_loss=8.62, eval_precision=0.737, eval_recall=0.703]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.76      0.76      3160
         LOC       0.35      0.34      0.35       482
         ORG       0.66      0.52      0.58      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.74      0.71      0.72      6937
   macro avg       0.66      0.63      0.64      6937
weighted avg       0.73      0.71      0.72      6937



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.957, train_acc=0.999, train_loss=0.072, train_precision=0.956, train_recall=0.96]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       424
         LOC       0.99      0.99      0.99        76
         ORG       0.98      0.98      0.98       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.727, eval_acc=0.963, eval_loss=8.9, eval_precision=0.72, eval_recall=0.74]   


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.78      0.76      0.77      3160
         LOC       0.34      0.46      0.39       482
         ORG       0.65      0.62      0.64      1645
         PER       0.83      0.89      0.86      1650

   micro avg       0.72      0.74      0.73      6937
   macro avg       0.65      0.68      0.66      6937
weighted avg       0.73      0.74      0.73      6937



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.976, train_acc=0.999, train_loss=0.0826, train_precision=0.975, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      0.97      0.98        76
         ORG       0.98      0.99      0.99       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.00it/s, F1=0.721, eval_acc=0.961, eval_loss=9.19, eval_precision=0.703, eval_recall=0.747]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.82      0.77      3160
         LOC       0.33      0.43      0.37       482
         ORG       0.63      0.57      0.60      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.70      0.75      0.72      6937
   macro avg       0.64      0.68      0.65      6937
weighted avg       0.71      0.75      0.72      6937



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.971, train_acc=1, train_loss=0.0538, train_precision=0.971, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.99      1.00       424
         LOC       0.97      0.99      0.98        76
         ORG       1.00      1.00      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.744, eval_acc=0.964, eval_loss=9.13, eval_precision=0.718, eval_recall=0.781]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.83      0.78      3160
         LOC       0.38      0.44      0.41       482
         ORG       0.64      0.65      0.65      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.72      0.78      0.75      6937
   macro avg       0.66      0.71      0.68      6937
weighted avg       0.72      0.78      0.75      6937



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.994, train_acc=1, train_loss=0.0227, train_precision=0.994, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       1.00      0.99      0.99        76
         ORG       1.00      1.00      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       1.00      1.00      1.00      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.747, eval_acc=0.964, eval_loss=9.62, eval_precision=0.739, eval_recall=0.764]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.81      0.78      3160
         LOC       0.38      0.40      0.39       482
         ORG       0.68      0.63      0.65      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.74      0.76      0.75      6937
   macro avg       0.67      0.69      0.68      6937
weighted avg       0.74      0.76      0.75      6937



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.982, train_acc=1, train_loss=0.0127, train_precision=0.981, train_recall=0.982] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      1.00      0.99        76
         ORG       1.00      1.00      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       1.00      1.00      1.00      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.736, eval_acc=0.964, eval_loss=10.1, eval_precision=0.753, eval_recall=0.73] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.78      0.77      0.77      3160
         LOC       0.44      0.26      0.33       482
         ORG       0.65      0.63      0.64      1645
         PER       0.87      0.90      0.88      1650

   micro avg       0.75      0.73      0.74      6937
   macro avg       0.68      0.64      0.66      6937
weighted avg       0.74      0.73      0.74      6937



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.968, train_acc=1, train_loss=0.0335, train_precision=0.969, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      0.99      0.99        76
         ORG       1.00      1.00      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       1.00      1.00      1.00      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.734, eval_acc=0.963, eval_loss=9.86, eval_precision=0.762, eval_recall=0.719]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.79      0.73      0.76      3160
         LOC       0.45      0.22      0.30       482
         ORG       0.65      0.68      0.66      1645
         PER       0.87      0.87      0.87      1650

   micro avg       0.76      0.72      0.74      6937
   macro avg       0.69      0.63      0.65      6937
weighted avg       0.75      0.72      0.73      6937



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.39it/s, F1=0.974, train_acc=0.999, train_loss=0.207, train_precision=0.975, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       1.00      0.99      0.99        76
         ORG       0.98      0.97      0.98       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.738, eval_acc=0.963, eval_loss=9.18, eval_precision=0.758, eval_recall=0.729]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.80      0.75      0.77      3160
         LOC       0.41      0.36      0.38       482
         ORG       0.67      0.66      0.66      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.76      0.73      0.74      6937
   macro avg       0.69      0.66      0.67      6937
weighted avg       0.76      0.73      0.74      6937



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.943, train_acc=0.999, train_loss=0.196, train_precision=0.946, train_recall=0.943]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.99      1.00      0.99        76
         ORG       0.99      0.98      0.98       256
         PER       1.00      0.99      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.03it/s, F1=0.694, eval_acc=0.957, eval_loss=8.53, eval_precision=0.666, eval_recall=0.737]


eval_reports:
              precision    recall  f1-score   support

         GPE       0.77      0.69      0.73      3160
         LOC       0.29      0.41      0.34       482
         ORG       0.53      0.73      0.62      1645
         PER       0.82      0.90      0.86      1650

   micro avg       0.67      0.73      0.70      6937
   macro avg       0.60      0.68      0.64      6937
weighted avg       0.69      0.73      0.71      6937



calculate data/few_shot/note4/train_1350.json etag: 100%|██████████| 518k/518k [00:00<00:00, 291MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 339MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 374MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 329kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_1350.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_1350_x2"
}
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 164993.33L/s]
build line mapper: 19L [00:00, 158118.60L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5649.09it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 209715.20it/s]
load dataset from data/few_shot/note4/train_1350.json: 0it [00:00, ?it/s]

load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_1350.json: 1350it [00:01, 838.09it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:12, 332.49it/s]
Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mod

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.0266, train_acc=0.77, train_loss=32.1, train_precision=0.024, train_recall=0.0332]       


train_reports:
              precision    recall  f1-score   support

         GPE       0.09      0.10      0.09       424
         LOC       0.00      0.00      0.00        76
         ORG       0.00      0.00      0.00       256
         PER       0.01      0.01      0.01       362

   micro avg       0.01      0.04      0.01      1118
   macro avg       0.02      0.03      0.03      1118
weighted avg       0.04      0.04      0.04      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.263, eval_acc=0.934, eval_loss=13.2, eval_precision=0.219, eval_recall=0.334]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.45      0.67      0.54      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.00      0.00      0.00      1645
         PER       0.07      0.16      0.10      1650

   micro avg       0.22      0.34      0.27      6937
   macro avg       0.13      0.21      0.16      6937
weighted avg       0.22      0.34      0.27      6937



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.62it/s, F1=0.448, train_acc=0.963, train_loss=4.33, train_precision=0.4, train_recall=0.541]   


train_reports:
              precision    recall  f1-score   support

         GPE       0.49      0.66      0.56       424
         LOC       0.11      0.07      0.08        76
         ORG       0.10      0.24      0.14       256
         PER       0.64      0.80      0.71       362

   micro avg       0.38      0.57      0.46      1118
   macro avg       0.34      0.44      0.37      1118
weighted avg       0.43      0.57      0.48      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.01it/s, F1=0.602, eval_acc=0.958, eval_loss=7.3, eval_precision=0.538, eval_recall=0.699] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.78      0.74      3160
         LOC       0.11      0.06      0.07       482
         ORG       0.22      0.47      0.30      1645
         PER       0.81      0.93      0.87      1650

   micro avg       0.53      0.69      0.60      6937
   macro avg       0.46      0.56      0.50      6937
weighted avg       0.57      0.69      0.62      6937



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.62it/s, F1=0.681, train_acc=0.98, train_loss=2.41, train_precision=0.654, train_recall=0.732] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.76      0.81      0.78       424
         LOC       0.36      0.36      0.36        76
         ORG       0.49      0.71      0.58       256
         PER       0.78      0.89      0.83       362

   micro avg       0.67      0.78      0.72      1118
   macro avg       0.60      0.69      0.64      1118
weighted avg       0.68      0.78      0.72      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.01it/s, F1=0.653, eval_acc=0.958, eval_loss=7.5, eval_precision=0.582, eval_recall=0.758] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.76      0.76      3160
         LOC       0.19      0.49      0.28       482
         ORG       0.37      0.65      0.47      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.57      0.75      0.65      6937
   macro avg       0.54      0.70      0.60      6937
weighted avg       0.65      0.75      0.69      6937



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.838, train_acc=0.989, train_loss=1.31, train_precision=0.819, train_recall=0.873]


train_reports:
              precision    recall  f1-score   support

         GPE       0.88      0.91      0.89       424
         LOC       0.64      0.66      0.65        76
         ORG       0.67      0.82      0.74       256
         PER       0.90      0.95      0.92       362

   micro avg       0.81      0.88      0.85      1118
   macro avg       0.77      0.83      0.80      1118
weighted avg       0.82      0.88      0.85      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.688, eval_acc=0.962, eval_loss=7.91, eval_precision=0.648, eval_recall=0.745]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.77      0.76      3160
         LOC       0.31      0.36      0.33       482
         ORG       0.44      0.66      0.53      1645
         PER       0.83      0.90      0.86      1650

   micro avg       0.64      0.75      0.69      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.67      0.75      0.70      6937



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.842, train_acc=0.992, train_loss=0.986, train_precision=0.82, train_recall=0.879] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.91      0.95      0.93       424
         LOC       0.71      0.78      0.74        76
         ORG       0.73      0.86      0.79       256
         PER       0.91      0.97      0.94       362

   micro avg       0.85      0.92      0.89      1118
   macro avg       0.82      0.89      0.85      1118
weighted avg       0.86      0.92      0.89      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.691, eval_acc=0.962, eval_loss=8.78, eval_precision=0.672, eval_recall=0.721]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.78      0.75      3160
         LOC       0.34      0.31      0.33       482
         ORG       0.49      0.57      0.52      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.67      0.73      0.70      6937
   macro avg       0.60      0.64      0.62      6937
weighted avg       0.67      0.73      0.70      6937



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.893, train_acc=0.994, train_loss=0.71, train_precision=0.876, train_recall=0.923] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.97      0.96       424
         LOC       0.87      0.87      0.87        76
         ORG       0.81      0.91      0.85       256
         PER       0.94      0.97      0.96       362

   micro avg       0.90      0.95      0.93      1118
   macro avg       0.89      0.93      0.91      1118
weighted avg       0.90      0.95      0.93      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.668, eval_acc=0.956, eval_loss=9.54, eval_precision=0.6, eval_recall=0.767]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.75      0.74      3160
         LOC       0.31      0.36      0.33       482
         ORG       0.38      0.73      0.50      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.60      0.76      0.67      6937
   macro avg       0.56      0.69      0.61      6937
weighted avg       0.64      0.76      0.69      6937



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.902, train_acc=0.996, train_loss=0.475, train_precision=0.891, train_recall=0.918]


train_reports:
              precision    recall  f1-score   support

         GPE       0.93      0.96      0.95       424
         LOC       0.86      0.82      0.84        76
         ORG       0.88      0.95      0.91       256
         PER       0.98      0.99      0.98       362

   micro avg       0.93      0.96      0.94      1118
   macro avg       0.91      0.93      0.92      1118
weighted avg       0.93      0.96      0.94      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.679, eval_acc=0.961, eval_loss=9.95, eval_precision=0.681, eval_recall=0.685]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.78      0.68      0.72      3160
         LOC       0.28      0.40      0.33       482
         ORG       0.49      0.54      0.51      1645
         PER       0.84      0.92      0.87      1650

   micro avg       0.67      0.68      0.68      6937
   macro avg       0.60      0.63      0.61      6937
weighted avg       0.69      0.68      0.68      6937



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.39it/s, F1=0.938, train_acc=0.998, train_loss=0.338, train_precision=0.932, train_recall=0.948]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       424
         LOC       0.93      0.91      0.92        76
         ORG       0.93      0.96      0.94       256
         PER       0.96      0.98      0.97       362

   micro avg       0.95      0.97      0.96      1118
   macro avg       0.95      0.96      0.95      1118
weighted avg       0.95      0.97      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.688, eval_acc=0.96, eval_loss=10.4, eval_precision=0.662, eval_recall=0.725] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.80      0.76      3160
         LOC       0.35      0.44      0.39       482
         ORG       0.45      0.48      0.46      1645
         PER       0.83      0.90      0.87      1650

   micro avg       0.66      0.72      0.69      6937
   macro avg       0.59      0.65      0.62      6937
weighted avg       0.66      0.72      0.69      6937



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.955, train_acc=0.998, train_loss=0.221, train_precision=0.949, train_recall=0.963]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       424
         LOC       0.88      0.89      0.89        76
         ORG       0.95      0.97      0.96       256
         PER       0.98      0.99      0.99       362

   micro avg       0.96      0.98      0.97      1118
   macro avg       0.95      0.96      0.95      1118
weighted avg       0.96      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.68, eval_acc=0.959, eval_loss=10.1, eval_precision=0.638, eval_recall=0.738] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.67      0.79      0.72      3160
         LOC       0.27      0.38      0.31       482
         ORG       0.51      0.56      0.53      1645
         PER       0.83      0.91      0.87      1650

   micro avg       0.63      0.73      0.68      6937
   macro avg       0.57      0.66      0.61      6937
weighted avg       0.64      0.73      0.68      6937



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.952, train_acc=0.998, train_loss=0.231, train_precision=0.948, train_recall=0.96] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.94      0.96      0.95        76
         ORG       0.94      0.96      0.95       256
         PER       0.98      0.99      0.98       362

   micro avg       0.97      0.98      0.97      1118
   macro avg       0.96      0.98      0.97      1118
weighted avg       0.97      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.671, eval_acc=0.953, eval_loss=11.3, eval_precision=0.603, eval_recall=0.77] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.74      0.73      3160
         LOC       0.23      0.48      0.31       482
         ORG       0.43      0.72      0.54      1645
         PER       0.88      0.92      0.90      1650

   micro avg       0.60      0.76      0.67      6937
   macro avg       0.57      0.72      0.62      6937
weighted avg       0.66      0.76      0.70      6937



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.937, train_acc=0.998, train_loss=0.379, train_precision=0.932, train_recall=0.948]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.90      0.91      0.90        76
         ORG       0.88      0.95      0.91       256
         PER       0.99      1.00      1.00       362

   micro avg       0.95      0.98      0.96      1118
   macro avg       0.94      0.96      0.95      1118
weighted avg       0.95      0.98      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.683, eval_acc=0.959, eval_loss=10.4, eval_precision=0.647, eval_recall=0.733]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.78      0.75      3160
         LOC       0.27      0.51      0.35       482
         ORG       0.48      0.54      0.51      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.64      0.73      0.68      6937
   macro avg       0.58      0.68      0.62      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.932, train_acc=0.997, train_loss=0.436, train_precision=0.925, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

         GPE       0.94      0.97      0.96       424
         LOC       0.89      0.95      0.92        76
         ORG       0.91      0.95      0.93       256
         PER       0.99      0.99      0.99       362

   micro avg       0.95      0.97      0.96      1118
   macro avg       0.93      0.96      0.95      1118
weighted avg       0.95      0.97      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.654, eval_acc=0.96, eval_loss=8.93, eval_precision=0.598, eval_recall=0.733] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.82      0.75      3160
         LOC       0.33      0.41      0.37       482
         ORG       0.35      0.52      0.42      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.60      0.74      0.66      6937
   macro avg       0.56      0.66      0.60      6937
weighted avg       0.62      0.74      0.68      6937



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.95, train_acc=0.999, train_loss=0.183, train_precision=0.944, train_recall=0.958] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       424
         LOC       0.97      0.97      0.97        76
         ORG       0.94      0.97      0.95       256
         PER       0.99      0.99      0.99       362

   micro avg       0.97      0.98      0.97      1118
   macro avg       0.97      0.98      0.97      1118
weighted avg       0.97      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.697, eval_acc=0.961, eval_loss=10.7, eval_precision=0.667, eval_recall=0.739]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.79      0.74      3160
         LOC       0.31      0.43      0.36       482
         ORG       0.54      0.55      0.55      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.66      0.74      0.70      6937
   macro avg       0.60      0.67      0.63      6937
weighted avg       0.67      0.74      0.70      6937



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.924, train_acc=0.997, train_loss=0.38, train_precision=0.918, train_recall=0.937] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.97       424
         LOC       0.97      0.95      0.96        76
         ORG       0.84      0.94      0.89       256
         PER       1.00      1.00      1.00       362

   micro avg       0.95      0.97      0.96      1118
   macro avg       0.95      0.97      0.95      1118
weighted avg       0.95      0.97      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.678, eval_acc=0.958, eval_loss=9.59, eval_precision=0.641, eval_recall=0.729]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.80      0.68      0.73      3160
         LOC       0.32      0.46      0.38       482
         ORG       0.43      0.71      0.54      1645
         PER       0.87      0.90      0.89      1650

   micro avg       0.65      0.72      0.68      6937
   macro avg       0.61      0.69      0.63      6937
weighted avg       0.70      0.72      0.70      6937



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.63it/s, F1=0.958, train_acc=0.999, train_loss=0.222, train_precision=0.952, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       424
         LOC       0.96      0.96      0.96        76
         ORG       0.91      0.96      0.94       256
         PER       1.00      1.00      1.00       362

   micro avg       0.97      0.98      0.97      1118
   macro avg       0.96      0.98      0.97      1118
weighted avg       0.97      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.07it/s, F1=0.683, eval_acc=0.96, eval_loss=9.53, eval_precision=0.65, eval_recall=0.729]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.73      0.74      3160
         LOC       0.25      0.50      0.33       482
         ORG       0.50      0.60      0.55      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.64      0.73      0.68      6937
   macro avg       0.59      0.68      0.62      6937
weighted avg       0.68      0.73      0.70      6937



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.71it/s, F1=0.972, train_acc=1, train_loss=0.0517, train_precision=0.971, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       1.00      1.00      1.00        76
         ORG       0.98      0.99      0.98       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      1.00      0.99      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       0.99      1.00      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.45it/s, F1=0.71, eval_acc=0.962, eval_loss=10.5, eval_precision=0.687, eval_recall=0.743] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.79      0.76      3160
         LOC       0.42      0.43      0.43       482
         ORG       0.51      0.60      0.55      1645
         PER       0.87      0.89      0.88      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.69      0.74      0.71      6937



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.963, train_acc=0.999, train_loss=0.0806, train_precision=0.961, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       1.00      1.00      1.00        76
         ORG       1.00      1.00      1.00       256
         PER       0.98      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.699, eval_acc=0.962, eval_loss=10.9, eval_precision=0.68, eval_recall=0.728] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.75      0.75      3160
         LOC       0.39      0.44      0.41       482
         ORG       0.51      0.60      0.55      1645
         PER       0.81      0.90      0.85      1650

   micro avg       0.68      0.73      0.70      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.68      0.73      0.71      6937



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.48it/s, F1=0.953, train_acc=0.999, train_loss=0.0924, train_precision=0.951, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.98      0.98       424
         LOC       0.99      1.00      0.99        76
         ORG       0.99      1.00      0.99       256
         PER       0.99      1.00      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.71, eval_acc=0.962, eval_loss=10.9, eval_precision=0.688, eval_recall=0.743] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.80      0.76      3160
         LOC       0.49      0.35      0.41       482
         ORG       0.52      0.57      0.54      1645
         PER       0.82      0.92      0.86      1650

   micro avg       0.69      0.74      0.71      6937
   macro avg       0.64      0.66      0.64      6937
weighted avg       0.68      0.74      0.71      6937



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.967, train_acc=0.999, train_loss=0.0683, train_precision=0.966, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      0.97      0.98        76
         ORG       0.99      1.00      0.99       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.703, eval_acc=0.962, eval_loss=11.3, eval_precision=0.684, eval_recall=0.733]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.76      0.76      3160
         LOC       0.36      0.46      0.41       482
         ORG       0.50      0.60      0.55      1645
         PER       0.85      0.90      0.88      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.62      0.68      0.65      6937
weighted avg       0.69      0.74      0.71      6937



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.969, train_acc=1, train_loss=0.0288, train_precision=0.968, train_recall=0.969]   


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.97      0.99      0.98        76
         ORG       1.00      1.00      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.712, eval_acc=0.962, eval_loss=11.4, eval_precision=0.684, eval_recall=0.752]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.71      0.82      0.76      3160
         LOC       0.42      0.37      0.39       482
         ORG       0.52      0.59      0.55      1645
         PER       0.86      0.91      0.88      1650

   micro avg       0.68      0.76      0.72      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.68      0.76      0.72      6937



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.63it/s, F1=0.973, train_acc=1, train_loss=0.0334, train_precision=0.973, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.97      0.97      0.97        76
         ORG       0.99      1.00      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      1.00      1.00      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.695, eval_acc=0.96, eval_loss=11.3, eval_precision=0.649, eval_recall=0.759] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.77      0.76      3160
         LOC       0.30      0.47      0.37       482
         ORG       0.49      0.64      0.55      1645
         PER       0.80      0.93      0.86      1650

   micro avg       0.65      0.76      0.70      6937
   macro avg       0.59      0.70      0.64      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.98, train_acc=1, train_loss=0.0602, train_precision=0.979, train_recall=0.981]     


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.96      0.96      0.96        76
         ORG       0.99      1.00      0.99       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.98      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.715, eval_acc=0.963, eval_loss=11.6, eval_precision=0.702, eval_recall=0.738]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.77      0.76      3160
         LOC       0.43      0.40      0.42       482
         ORG       0.51      0.61      0.56      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.64      0.67      0.66      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.978, train_acc=1, train_loss=0.0787, train_precision=0.977, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       1.00      1.00      1.00        76
         ORG       0.98      0.99      0.99       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      1.00      0.99      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       0.99      1.00      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.05it/s, F1=0.677, eval_acc=0.956, eval_loss=13.3, eval_precision=0.62, eval_recall=0.763] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.75      0.75      3160
         LOC       0.36      0.47      0.41       482
         ORG       0.42      0.72      0.53      1645
         PER       0.81      0.90      0.85      1650

   micro avg       0.62      0.76      0.68      6937
   macro avg       0.58      0.71      0.64      6937
weighted avg       0.66      0.76      0.70      6937



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.39it/s, F1=0.905, train_acc=0.997, train_loss=0.446, train_precision=0.903, train_recall=0.912]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.97      0.96       424
         LOC       0.94      0.95      0.94        76
         ORG       0.92      0.94      0.93       256
         PER       0.98      0.98      0.98       362

   micro avg       0.95      0.96      0.96      1118
   macro avg       0.95      0.96      0.95      1118
weighted avg       0.95      0.96      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.663, eval_acc=0.956, eval_loss=10.7, eval_precision=0.602, eval_recall=0.75] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.76      0.74      3160
         LOC       0.25      0.51      0.34       482
         ORG       0.44      0.61      0.51      1645
         PER       0.76      0.92      0.83      1650

   micro avg       0.60      0.75      0.67      6937
   macro avg       0.54      0.70      0.61      6937
weighted avg       0.63      0.75      0.68      6937



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.947, train_acc=0.998, train_loss=0.36, train_precision=0.944, train_recall=0.955] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       424
         LOC       0.92      0.95      0.94        76
         ORG       0.95      0.98      0.96       256
         PER       0.98      0.99      0.98       362

   micro avg       0.96      0.98      0.97      1118
   macro avg       0.95      0.97      0.96      1118
weighted avg       0.96      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.692, eval_acc=0.959, eval_loss=11.1, eval_precision=0.662, eval_recall=0.736]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.79      0.76      3160
         LOC       0.43      0.38      0.40       482
         ORG       0.53      0.56      0.55      1645
         PER       0.71      0.90      0.79      1650

   micro avg       0.66      0.73      0.70      6937
   macro avg       0.60      0.66      0.62      6937
weighted avg       0.66      0.73      0.69      6937



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.972, train_acc=0.998, train_loss=0.182, train_precision=0.968, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.95      0.96      0.95        76
         ORG       0.98      0.99      0.98       256
         PER       0.96      0.98      0.97       362

   micro avg       0.97      0.98      0.98      1118
   macro avg       0.97      0.98      0.97      1118
weighted avg       0.97      0.98      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.702, eval_acc=0.961, eval_loss=10.4, eval_precision=0.668, eval_recall=0.75] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.81      0.75      3160
         LOC       0.36      0.37      0.37       482
         ORG       0.53      0.63      0.57      1645
         PER       0.84      0.87      0.86      1650

   micro avg       0.67      0.75      0.71      6937
   macro avg       0.61      0.67      0.64      6937
weighted avg       0.67      0.75      0.71      6937



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.954, train_acc=0.999, train_loss=0.136, train_precision=0.953, train_recall=0.956]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       424
         LOC       0.96      0.97      0.97        76
         ORG       0.98      0.98      0.98       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.98      0.99      0.98      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.714, eval_acc=0.963, eval_loss=11.5, eval_precision=0.703, eval_recall=0.736]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.74      0.76      3160
         LOC       0.37      0.41      0.39       482
         ORG       0.54      0.65      0.59      1645
         PER       0.85      0.90      0.88      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.71      0.74      0.72      6937



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.954, train_acc=0.999, train_loss=0.108, train_precision=0.952, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.92      0.96      0.94        76
         ORG       0.98      1.00      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      1.00      0.99      1118
   macro avg       0.98      0.99      0.98      1118
weighted avg       0.99      1.00      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.10it/s, F1=0.725, eval_acc=0.963, eval_loss=11.1, eval_precision=0.716, eval_recall=0.741]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.77      0.76      0.77      3160
         LOC       0.38      0.41      0.40       482
         ORG       0.59      0.63      0.61      1645
         PER       0.85      0.90      0.87      1650

   micro avg       0.72      0.74      0.73      6937
   macro avg       0.65      0.68      0.66      6937
weighted avg       0.72      0.74      0.73      6937



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.97, train_acc=1, train_loss=0.0691, train_precision=0.971, train_recall=0.97]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       1.00      0.99      0.99        76
         ORG       1.00      1.00      1.00       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       1.00      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.705, eval_acc=0.961, eval_loss=11.4, eval_precision=0.683, eval_recall=0.738]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.77      0.76      3160
         LOC       0.28      0.52      0.36       482
         ORG       0.60      0.57      0.58      1645
         PER       0.83      0.91      0.87      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.62      0.69      0.64      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.974, train_acc=0.999, train_loss=0.0944, train_precision=0.973, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.98      0.98       424
         LOC       0.97      0.99      0.98        76
         ORG       0.99      1.00      0.99       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.18it/s, F1=0.713, eval_acc=0.962, eval_loss=11.3, eval_precision=0.705, eval_recall=0.73] 


eval_reports:
              precision    recall  f1-score   support

         GPE       0.75      0.76      0.75      3160
         LOC       0.38      0.42      0.40       482
         ORG       0.57      0.59      0.58      1645
         PER       0.84      0.90      0.87      1650

   micro avg       0.70      0.73      0.72      6937
   macro avg       0.64      0.67      0.65      6937
weighted avg       0.70      0.73      0.72      6937



calculate data/few_shot/note4/train_1350.json etag: 100%|██████████| 518k/518k [00:00<00:00, 292MB/s]
calculate data/few_shot/note4/dev.json etag: 100%|██████████| 2.46M/2.46M [00:00<00:00, 321MB/s]
calculate data/few_shot/note4/test.json etag: 100%|██████████| 2.56M/2.56M [00:00<00:00, 373MB/s]
calculate data/few_shot/note4/labels.txt etag: 100%|██████████| 100/100 [00:00<00:00, 194kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/note4/train_1350.json",
    "eval_file": "data/few_shot/note4/dev.json",
    "test_file": "data/few_shot/note4/test.json",
    "tag_file": "data/few_shot/note4/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "note4_pretrain_lebert_crf_1350_x3"
}
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/lexicon_tree



count line size data/few_shot/note4/labels.txt: 19L [00:00, 166024.53L/s]
build line mapper: 19L [00:00, 151505.28L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 19/19 [00:00<00:00, 5492.95it/s]
load vocab from list: 100%|██████████| 18/18 [00:00<00:00, 183692.15it/s]
load dataset from data/few_shot/note4/train_1350.json: 0it [00:00, ?it/s]

load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/matched_words
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/word_vocab
load cached ./temp/a92fb4e09540fd0fde5e16ec2dc288e7_459650795b3185143e4c407cbff316ae_fffb050c26d1ecf702c9514c0d73b692_f940bdbdfe1972ae40e4ceff85d92072/1000000/vocab_embedding


load dataset from data/few_shot/note4/train_1350.json: 1350it [00:01, 840.30it/s]
load dataset from data/few_shot/note4/dev.json: 4301it [00:07, 569.75it/s]


Load pretrained embedding from file.........


Some weights of the model checkpoint at save_pretrained/note4_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of LEBertModel were not initialized from the model checkpoint at save_pretrained/note4_pretrain_

train_reports:
              precision    recall  f1-score   support

         GPE       0.13      0.09      0.11       424
         LOC       0.00      0.00      0.00        76
         ORG       0.05      0.05      0.05       256
         PER       0.01      0.14      0.02       362
           _       0.00      0.00      0.00         0

   micro avg       0.02      0.09      0.03      1118
   macro avg       0.04      0.06      0.04      1118
weighted avg       0.06      0.09      0.06      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.06it/s, F1=0.383, eval_acc=0.938, eval_loss=8.9, eval_precision=0.409, eval_recall=0.367] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.25      0.29      0.27      3160
         LOC       0.00      0.00      0.00       482
         ORG       0.32      0.14      0.20      1645
         PER       0.76      0.78      0.77      1650

   micro avg       0.40      0.35      0.37      6937
   macro avg       0.33      0.30      0.31      6937
weighted avg       0.37      0.35      0.35      6937



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.616, train_acc=0.97, train_loss=3.04, train_precision=0.608, train_recall=0.651] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.58      0.72      0.64       424
         LOC       0.17      0.13      0.15        76
         ORG       0.51      0.56      0.53       256
         PER       0.79      0.84      0.81       362

   micro avg       0.61      0.68      0.64      1118
   macro avg       0.51      0.56      0.53      1118
weighted avg       0.60      0.68      0.64      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.09it/s, F1=0.665, eval_acc=0.962, eval_loss=5.3, eval_precision=0.627, eval_recall=0.718] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.65      0.73      0.69      3160
         LOC       0.18      0.21      0.19       482
         ORG       0.52      0.61      0.56      1645
         PER       0.83      0.93      0.87      1650

   micro avg       0.63      0.71      0.67      6937
   macro avg       0.54      0.62      0.58      6937
weighted avg       0.63      0.71      0.67      6937



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:50<00:00,  3.38it/s, F1=0.769, train_acc=0.984, train_loss=1.63, train_precision=0.749, train_recall=0.808]


train_reports:
              precision    recall  f1-score   support

         GPE       0.79      0.87      0.83       424
         LOC       0.49      0.47      0.48        76
         ORG       0.67      0.79      0.73       256
         PER       0.89      0.92      0.91       362

   micro avg       0.77      0.84      0.81      1118
   macro avg       0.71      0.76      0.74      1118
weighted avg       0.78      0.84      0.81      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.14it/s, F1=0.611, eval_acc=0.952, eval_loss=6.56, eval_precision=0.616, eval_recall=0.614]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.60      0.65      0.62      3160
         LOC       0.27      0.37      0.31       482
         ORG       0.46      0.33      0.38      1645
         PER       0.89      0.88      0.88      1650

   micro avg       0.61      0.61      0.61      6937
   macro avg       0.55      0.56      0.55      6937
weighted avg       0.61      0.61      0.61      6937



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.862, train_acc=0.99, train_loss=0.941, train_precision=0.849, train_recall=0.887]


train_reports:
              precision    recall  f1-score   support

         GPE       0.88      0.93      0.90       424
         LOC       0.74      0.78      0.76        76
         ORG       0.77      0.84      0.80       256
         PER       0.93      0.97      0.95       362

   micro avg       0.86      0.91      0.89      1118
   macro avg       0.83      0.88      0.85      1118
weighted avg       0.86      0.91      0.89      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.42it/s, F1=0.703, eval_acc=0.96, eval_loss=6.19, eval_precision=0.666, eval_recall=0.755] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.83      0.75      3160
         LOC       0.28      0.38      0.32       482
         ORG       0.59      0.56      0.57      1645
         PER       0.85      0.92      0.88      1650

   micro avg       0.67      0.76      0.71      6937
   macro avg       0.60      0.67      0.63      6937
weighted avg       0.67      0.76      0.71      6937



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.91, train_acc=0.994, train_loss=0.655, train_precision=0.897, train_recall=0.931] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.90      0.94      0.92       424
         LOC       0.69      0.76      0.72        76
         ORG       0.87      0.93      0.90       256
         PER       0.95      0.98      0.96       362

   micro avg       0.89      0.94      0.92      1118
   macro avg       0.85      0.90      0.88      1118
weighted avg       0.90      0.94      0.92      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.69, eval_acc=0.96, eval_loss=7.56, eval_precision=0.631, eval_recall=0.773]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.60      0.88      0.71      3160
         LOC       0.29      0.33      0.31       482
         ORG       0.59      0.55      0.57      1645
         PER       0.86      0.92      0.89      1650

   micro avg       0.63      0.77      0.70      6937
   macro avg       0.58      0.67      0.62      6937
weighted avg       0.64      0.77      0.69      6937



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.919, train_acc=0.996, train_loss=0.519, train_precision=0.912, train_recall=0.931]


train_reports:
              precision    recall  f1-score   support

         GPE       0.93      0.96      0.94       424
         LOC       0.92      0.92      0.92        76
         ORG       0.91      0.95      0.93       256
         PER       0.97      0.98      0.97       362

   micro avg       0.94      0.96      0.95      1118
   macro avg       0.93      0.95      0.94      1118
weighted avg       0.94      0.96      0.95      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.46it/s, F1=0.679, eval_acc=0.96, eval_loss=7.7, eval_precision=0.71, eval_recall=0.658]   


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.65      0.68      3160
         LOC       0.36      0.34      0.35       482
         ORG       0.60      0.51      0.55      1645
         PER       0.87      0.90      0.88      1650

   micro avg       0.71      0.66      0.68      6937
   macro avg       0.64      0.60      0.62      6937
weighted avg       0.70      0.66      0.68      6937



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.66it/s, F1=0.926, train_acc=0.997, train_loss=0.343, train_precision=0.918, train_recall=0.939]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       424
         LOC       0.89      0.87      0.88        76
         ORG       0.92      0.95      0.93       256
         PER       0.97      0.99      0.98       362

   micro avg       0.95      0.97      0.96      1118
   macro avg       0.93      0.95      0.94      1118
weighted avg       0.95      0.97      0.96      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.701, eval_acc=0.96, eval_loss=7.71, eval_precision=0.653, eval_recall=0.766] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.66      0.85      0.74      3160
         LOC       0.28      0.33      0.30       482
         ORG       0.57      0.57      0.57      1645
         PER       0.82      0.91      0.86      1650

   micro avg       0.65      0.76      0.70      6937
   macro avg       0.58      0.66      0.62      6937
weighted avg       0.65      0.76      0.70      6937



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.954, train_acc=0.997, train_loss=0.28, train_precision=0.948, train_recall=0.963] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.96      0.95      0.95        76
         ORG       0.96      0.96      0.96       256
         PER       0.97      0.99      0.98       362

   micro avg       0.97      0.98      0.98      1118
   macro avg       0.97      0.97      0.97      1118
weighted avg       0.97      0.98      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.39it/s, F1=0.701, eval_acc=0.962, eval_loss=8.21, eval_precision=0.702, eval_recall=0.708]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.75      0.73      3160
         LOC       0.30      0.35      0.33       482
         ORG       0.64      0.57      0.60      1645
         PER       0.82      0.86      0.84      1650

   micro avg       0.70      0.71      0.70      6937
   macro avg       0.62      0.63      0.63      6937
weighted avg       0.70      0.71      0.70      6937



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.63it/s, F1=0.939, train_acc=0.997, train_loss=0.325, train_precision=0.929, train_recall=0.955]


train_reports:
              precision    recall  f1-score   support

         GPE       0.96      0.98      0.97       424
         LOC       0.96      0.99      0.97        76
         ORG       0.95      0.96      0.96       256
         PER       0.97      0.99      0.98       362

   micro avg       0.96      0.98      0.97      1118
   macro avg       0.96      0.98      0.97      1118
weighted avg       0.96      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.02it/s, F1=0.706, eval_acc=0.962, eval_loss=7.36, eval_precision=0.68, eval_recall=0.742] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.76      0.73      3160
         LOC       0.29      0.43      0.34       482
         ORG       0.58      0.61      0.60      1645
         PER       0.89      0.91      0.90      1650

   micro avg       0.68      0.74      0.71      6937
   macro avg       0.62      0.68      0.64      6937
weighted avg       0.69      0.74      0.71      6937



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.66it/s, F1=0.953, train_acc=0.998, train_loss=0.181, train_precision=0.95, train_recall=0.958] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.99      0.98       424
         LOC       0.96      0.96      0.96        76
         ORG       0.97      0.99      0.98       256
         PER       0.99      0.99      0.99       362

   micro avg       0.98      0.99      0.98      1118
   macro avg       0.97      0.98      0.98      1118
weighted avg       0.98      0.99      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.01it/s, F1=0.711, eval_acc=0.963, eval_loss=7.42, eval_precision=0.679, eval_recall=0.756]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.80      0.74      3160
         LOC       0.33      0.39      0.36       482
         ORG       0.59      0.60      0.59      1645
         PER       0.82      0.92      0.87      1650

   micro avg       0.68      0.75      0.71      6937
   macro avg       0.61      0.68      0.64      6937
weighted avg       0.68      0.75      0.71      6937



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.39it/s, F1=0.966, train_acc=0.998, train_loss=0.23, train_precision=0.959, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       424
         LOC       0.96      0.95      0.95        76
         ORG       0.96      0.98      0.97       256
         PER       0.96      0.98      0.97       362

   micro avg       0.97      0.98      0.98      1118
   macro avg       0.97      0.97      0.97      1118
weighted avg       0.97      0.98      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.04it/s, F1=0.699, eval_acc=0.96, eval_loss=8.37, eval_precision=0.656, eval_recall=0.759] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.68      0.77      0.73      3160
         LOC       0.28      0.43      0.34       482
         ORG       0.55      0.67      0.61      1645
         PER       0.87      0.90      0.89      1650

   micro avg       0.66      0.75      0.70      6937
   macro avg       0.60      0.69      0.64      6937
weighted avg       0.67      0.75      0.71      6937



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.961, train_acc=0.997, train_loss=0.385, train_precision=0.954, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.94      0.96      0.95        76
         ORG       0.91      0.95      0.93       256
         PER       0.98      0.99      0.98       362

   micro avg       0.96      0.98      0.97      1118
   macro avg       0.95      0.97      0.96      1118
weighted avg       0.96      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.701, eval_acc=0.96, eval_loss=8.63, eval_precision=0.673, eval_recall=0.738] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.78      0.73      3160
         LOC       0.32      0.37      0.34       482
         ORG       0.59      0.60      0.60      1645
         PER       0.83      0.90      0.86      1650

   micro avg       0.67      0.74      0.70      6937
   macro avg       0.61      0.66      0.63      6937
weighted avg       0.67      0.74      0.70      6937



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.957, train_acc=0.998, train_loss=0.25, train_precision=0.957, train_recall=0.96]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.99       424
         LOC       0.95      0.95      0.95        76
         ORG       0.95      0.96      0.95       256
         PER       0.99      0.99      0.99       362

   micro avg       0.97      0.98      0.98      1118
   macro avg       0.97      0.97      0.97      1118
weighted avg       0.97      0.98      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.15it/s, F1=0.702, eval_acc=0.959, eval_loss=7.89, eval_precision=0.666, eval_recall=0.751]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.70      0.80      0.75      3160
         LOC       0.37      0.32      0.34       482
         ORG       0.51      0.65      0.57      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.67      0.75      0.70      6937
   macro avg       0.61      0.66      0.63      6937
weighted avg       0.67      0.75      0.71      6937



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.61it/s, F1=0.967, train_acc=0.999, train_loss=0.0955, train_precision=0.963, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.94      0.95      0.94        76
         ORG       0.98      1.00      0.99       256
         PER       0.99      1.00      0.99       362

   micro avg       0.98      0.99      0.99      1118
   macro avg       0.97      0.98      0.98      1118
weighted avg       0.98      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.42it/s, F1=0.716, eval_acc=0.962, eval_loss=9.09, eval_precision=0.702, eval_recall=0.74] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.72      0.79      0.75      3160
         LOC       0.38      0.42      0.40       482
         ORG       0.64      0.59      0.61      1645
         PER       0.82      0.88      0.85      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.64      0.67      0.65      6937
weighted avg       0.70      0.74      0.72      6937



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.66it/s, F1=0.964, train_acc=0.999, train_loss=0.0745, train_precision=0.964, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      1.00      0.99        76
         ORG       0.97      0.98      0.98       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.18it/s, F1=0.702, eval_acc=0.96, eval_loss=10.8, eval_precision=0.714, eval_recall=0.699] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.76      0.75      3160
         LOC       0.40      0.41      0.41       482
         ORG       0.65      0.52      0.58      1645
         PER       0.83      0.88      0.85      1650

   micro avg       0.72      0.70      0.71      6937
   macro avg       0.66      0.64      0.65      6937
weighted avg       0.72      0.70      0.71      6937



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.958, train_acc=0.999, train_loss=0.0794, train_precision=0.955, train_recall=0.96] 


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       1.00      1.00      1.00        76
         ORG       0.97      0.99      0.98       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      1.00      0.99      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       0.99      1.00      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.45it/s, F1=0.71, eval_acc=0.962, eval_loss=9.97, eval_precision=0.702, eval_recall=0.725] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.72      0.73      3160
         LOC       0.32      0.42      0.36       482
         ORG       0.61      0.63      0.62      1645
         PER       0.85      0.90      0.87      1650

   micro avg       0.70      0.72      0.71      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.71      0.72      0.71      6937



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.984, train_acc=1, train_loss=0.066, train_precision=0.983, train_recall=0.984]     


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      1.00      0.99        76
         ORG       0.98      0.99      0.98       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      1.00      0.99      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       0.99      1.00      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.713, eval_acc=0.963, eval_loss=9.66, eval_precision=0.71, eval_recall=0.725] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.75      0.74      3160
         LOC       0.35      0.35      0.35       482
         ORG       0.62      0.64      0.63      1645
         PER       0.86      0.88      0.87      1650

   micro avg       0.71      0.73      0.72      6937
   macro avg       0.64      0.65      0.65      6937
weighted avg       0.71      0.73      0.72      6937



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.958, train_acc=0.999, train_loss=0.124, train_precision=0.958, train_recall=0.96]  


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.89      0.93      0.91        76
         ORG       0.99      1.00      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.98      0.99      0.99      1118
   macro avg       0.96      0.98      0.97      1118
weighted avg       0.98      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:19<00:00,  3.40it/s, F1=0.702, eval_acc=0.962, eval_loss=8.56, eval_precision=0.695, eval_recall=0.719]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.72      0.73      3160
         LOC       0.36      0.41      0.38       482
         ORG       0.65      0.60      0.63      1645
         PER       0.78      0.91      0.84      1650

   micro avg       0.70      0.72      0.71      6937
   macro avg       0.63      0.66      0.64      6937
weighted avg       0.70      0.72      0.71      6937



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.68it/s, F1=0.948, train_acc=0.999, train_loss=0.165, train_precision=0.944, train_recall=0.954]


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.99      0.98       424
         LOC       0.91      0.95      0.93        76
         ORG       0.98      0.99      0.98       256
         PER       0.98      0.99      0.99       362

   micro avg       0.98      0.99      0.98      1118
   macro avg       0.96      0.98      0.97      1118
weighted avg       0.98      0.99      0.98      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.71, eval_acc=0.961, eval_loss=9.58, eval_precision=0.698, eval_recall=0.731] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.81      0.77      3160
         LOC       0.30      0.44      0.36       482
         ORG       0.62      0.58      0.60      1645
         PER       0.87      0.83      0.85      1650

   micro avg       0.70      0.73      0.72      6937
   macro avg       0.63      0.67      0.64      6937
weighted avg       0.71      0.73      0.72      6937



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.929, train_acc=0.998, train_loss=0.266, train_precision=0.925, train_recall=0.935]


train_reports:
              precision    recall  f1-score   support

         GPE       0.97      0.98      0.98       424
         LOC       0.99      1.00      0.99        76
         ORG       0.95      0.96      0.96       256
         PER       0.98      0.98      0.98       362

   micro avg       0.97      0.98      0.97      1118
   macro avg       0.97      0.98      0.98      1118
weighted avg       0.97      0.98      0.97      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.704, eval_acc=0.96, eval_loss=7.69, eval_precision=0.659, eval_recall=0.768] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.77      0.75      3160
         LOC       0.34      0.46      0.39       482
         ORG       0.52      0.70      0.60      1645
         PER       0.83      0.92      0.87      1650

   micro avg       0.66      0.77      0.71      6937
   macro avg       0.60      0.71      0.65      6937
weighted avg       0.68      0.77      0.72      6937



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.64it/s, F1=0.982, train_acc=0.999, train_loss=0.129, train_precision=0.98, train_recall=0.986] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       1.00      1.00      1.00        76
         ORG       0.97      0.99      0.98       256
         PER       0.99      0.99      0.99       362

   micro avg       0.98      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.98      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.714, eval_acc=0.961, eval_loss=9.58, eval_precision=0.723, eval_recall=0.714]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.77      0.75      3160
         LOC       0.33      0.40      0.36       482
         ORG       0.68      0.57      0.62      1645
         PER       0.88      0.85      0.86      1650

   micro avg       0.73      0.72      0.72      6937
   macro avg       0.66      0.65      0.65      6937
weighted avg       0.73      0.72      0.72      6937



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.984, train_acc=1, train_loss=0.0587, train_precision=0.984, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      1.00       424
         LOC       0.99      1.00      0.99        76
         ORG       1.00      1.00      1.00       256
         PER       0.99      1.00      1.00       362

   micro avg       0.99      1.00      1.00      1118
   macro avg       0.99      1.00      1.00      1118
weighted avg       0.99      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.16it/s, F1=0.723, eval_acc=0.963, eval_loss=9.03, eval_precision=0.727, eval_recall=0.728]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.76      0.76      3160
         LOC       0.40      0.39      0.39       482
         ORG       0.63      0.61      0.62      1645
         PER       0.85      0.88      0.87      1650

   micro avg       0.73      0.73      0.73      6937
   macro avg       0.66      0.66      0.66      6937
weighted avg       0.73      0.73      0.73      6937



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.973, train_acc=0.999, train_loss=0.0703, train_precision=0.972, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      1.00      0.99       424
         LOC       1.00      1.00      1.00        76
         ORG       0.99      0.99      0.99       256
         PER       0.99      1.00      0.99       362

   micro avg       0.99      1.00      0.99      1118
   macro avg       0.99      1.00      0.99      1118
weighted avg       0.99      1.00      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.12it/s, F1=0.713, eval_acc=0.961, eval_loss=9.8, eval_precision=0.697, eval_recall=0.737] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.73      0.78      0.75      3160
         LOC       0.28      0.44      0.34       482
         ORG       0.64      0.59      0.62      1645
         PER       0.88      0.89      0.88      1650

   micro avg       0.70      0.74      0.72      6937
   macro avg       0.63      0.67      0.65      6937
weighted avg       0.71      0.74      0.72      6937



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.988, train_acc=0.999, train_loss=0.0894, train_precision=0.99, train_recall=0.989] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.98      0.98      0.98       424
         LOC       0.96      0.97      0.97        76
         ORG       0.98      0.99      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.98      0.99      0.99      1118
   macro avg       0.98      0.99      0.98      1118
weighted avg       0.98      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.11it/s, F1=0.675, eval_acc=0.954, eval_loss=10.7, eval_precision=0.671, eval_recall=0.691]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.76      0.57      0.65      3160
         LOC       0.28      0.38      0.32       482
         ORG       0.53      0.73      0.62      1645
         PER       0.86      0.90      0.88      1650

   micro avg       0.67      0.67      0.67      6937
   macro avg       0.61      0.64      0.62      6937
weighted avg       0.70      0.67      0.67      6937



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.982, train_acc=0.999, train_loss=0.138, train_precision=0.979, train_recall=0.985] 


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.97      0.96      0.97        76
         ORG       0.99      1.00      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.01it/s, F1=0.719, eval_acc=0.962, eval_loss=9.74, eval_precision=0.747, eval_recall=0.702]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.71      0.73      3160
         LOC       0.40      0.39      0.39       482
         ORG       0.70      0.59      0.64      1645
         PER       0.86      0.89      0.87      1650

   micro avg       0.74      0.70      0.72      6937
   macro avg       0.68      0.64      0.66      6937
weighted avg       0.74      0.70      0.72      6937



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.992, train_acc=1, train_loss=0.0387, train_precision=0.993, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      1.00      0.99        76
         ORG       1.00      0.99      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       1.00      1.00      1.00      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.718, eval_acc=0.962, eval_loss=10.1, eval_precision=0.72, eval_recall=0.724] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.73      0.73      3160
         LOC       0.38      0.41      0.39       482
         ORG       0.63      0.63      0.63      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.72      0.72      0.72      6937
   macro avg       0.65      0.66      0.66      6937
weighted avg       0.72      0.72      0.72      6937



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.968, train_acc=1, train_loss=0.0255, train_precision=0.968, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      1.00      1.00       424
         LOC       0.99      0.99      0.99        76
         ORG       0.99      0.99      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       1.00      1.00      1.00      1118
   macro avg       0.99      0.99      0.99      1118
weighted avg       1.00      1.00      1.00      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.08it/s, F1=0.717, eval_acc=0.962, eval_loss=10.7, eval_precision=0.723, eval_recall=0.72] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.75      0.73      0.74      3160
         LOC       0.36      0.42      0.39       482
         ORG       0.63      0.62      0.63      1645
         PER       0.86      0.89      0.88      1650

   micro avg       0.72      0.72      0.72      6937
   macro avg       0.65      0.66      0.66      6937
weighted avg       0.72      0.72      0.72      6937



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.969, train_acc=0.999, train_loss=0.113, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.98      0.99       424
         LOC       0.95      0.97      0.96        76
         ORG       0.99      1.00      0.99       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.98      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.13it/s, F1=0.715, eval_acc=0.961, eval_loss=9.09, eval_precision=0.692, eval_recall=0.748]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.69      0.75      0.72      3160
         LOC       0.32      0.40      0.36       482
         ORG       0.63      0.65      0.64      1645
         PER       0.87      0.91      0.89      1650

   micro avg       0.69      0.74      0.71      6937
   macro avg       0.63      0.68      0.65      6937
weighted avg       0.69      0.74      0.71      6937



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.65it/s, F1=0.973, train_acc=0.999, train_loss=0.111, train_precision=0.973, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

         GPE       1.00      0.99      0.99       424
         LOC       0.92      0.96      0.94        76
         ORG       1.00      1.00      1.00       256
         PER       0.99      0.99      0.99       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.98      0.98      0.98      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:20<00:00,  3.39it/s, F1=0.722, eval_acc=0.962, eval_loss=9.54, eval_precision=0.722, eval_recall=0.731]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

         GPE       0.74      0.72      0.73      3160
         LOC       0.42      0.32      0.36       482
         ORG       0.62      0.68      0.65      1645
         PER       0.86      0.91      0.89      1650

   micro avg       0.72      0.73      0.73      6937
   macro avg       0.66      0.66      0.66      6937
weighted avg       0.72      0.73      0.72      6937



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:46<00:00,  3.67it/s, F1=0.975, train_acc=0.999, train_loss=0.0926, train_precision=0.975, train_recall=0.976]


train_reports:
              precision    recall  f1-score   support

         GPE       0.99      0.99      0.99       424
         LOC       0.95      0.96      0.95        76
         ORG       1.00      1.00      1.00       256
         PER       1.00      1.00      1.00       362

   micro avg       0.99      0.99      0.99      1118
   macro avg       0.98      0.99      0.99      1118
weighted avg       0.99      0.99      0.99      1118



Eval Result: 100%|██████████| 68/68 [00:16<00:00,  4.17it/s, F1=0.686, eval_acc=0.96, eval_loss=9.37, eval_precision=0.675, eval_recall=0.705] 


eval_reports:
              precision    recall  f1-score   support

         GPE       0.73      0.64      0.68      3160
         LOC       0.24      0.49      0.32       482
         ORG       0.64      0.67      0.65      1645
         PER       0.88      0.90      0.89      1650

   micro avg       0.67      0.70      0.69      6937
   macro avg       0.62      0.67      0.64      6937
weighted avg       0.71      0.70      0.70      6937



calculate data/few_shot/msra/train_250.json etag: 100%|██████████| 161k/161k [00:00<00:00, 8.22MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 326MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 370MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 119kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_250.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_250_x1"
}
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 110169.34L/s]
build line mapper: 14L [00:00, 21152.83L/s]4 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4304.06it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 152733.76it/s]

load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding



load dataset from data/few_shot/msra/train_250.json: 250it [00:00, 541.65it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:07, 583.70it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fro

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=0.000137, train_acc=0.341, train_loss=88.2, train_precision=6.94e-5, train_recall=0.00446]  


train_reports:
              precision    recall  f1-score   support

          NR       0.03      0.01      0.02        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.01      0.00      0.01       410
weighted avg       0.01      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.39it/s, F1=0, eval_acc=0.897, eval_loss=25.5, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.35it/s, F1=0, train_acc=0.889, train_loss=29.7, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.00      0.00      0.00       410
weighted avg       0.00      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0, eval_acc=0.897, eval_loss=20.5, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0, train_acc=0.891, train_loss=20.6, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.00      0.00      0.00       410
weighted avg       0.00      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.00267, eval_acc=0.902, eval_loss=12.7, eval_precision=0.00687, eval_recall=0.00178]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.01      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.46it/s, F1=0.113, train_acc=0.926, train_loss=12.5, train_precision=0.11, train_recall=0.125]      


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.13      0.19      0.16       222
          NT       0.03      0.05      0.03       105

   micro avg       0.08      0.12      0.10       410
   macro avg       0.05      0.08      0.06       410
weighted avg       0.08      0.12      0.09       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.248, eval_acc=0.939, eval_loss=7.75, eval_precision=0.242, eval_recall=0.266]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.30      0.46      0.37      2857
          NT       0.07      0.07      0.07      1314

   micro avg       0.21      0.25      0.23      5587
   macro avg       0.12      0.18      0.15      5587
weighted avg       0.17      0.25      0.20      5587



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.506, train_acc=0.97, train_loss=5.82, train_precision=0.485, train_recall=0.556] 


train_reports:
              precision    recall  f1-score   support

          NR       0.49      0.58      0.53        83
          NS       0.44      0.58      0.50       222
          NT       0.41      0.51      0.46       105

   micro avg       0.45      0.56      0.50       410
   macro avg       0.45      0.56      0.50       410
weighted avg       0.45      0.56      0.50       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.634, eval_acc=0.964, eval_loss=5.21, eval_precision=0.59, eval_recall=0.698] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.83      0.90      0.86      1416
          NS       0.54      0.66      0.59      2857
          NT       0.40      0.47      0.43      1314

   micro avg       0.57      0.68      0.62      5587
   macro avg       0.59      0.68      0.63      5587
weighted avg       0.58      0.68      0.62      5587



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.43it/s, F1=0.806, train_acc=0.986, train_loss=2.91, train_precision=0.796, train_recall=0.823]


train_reports:
              precision    recall  f1-score   support

          NR       0.89      0.89      0.89        83
          NS       0.81      0.83      0.82       222
          NT       0.69      0.78      0.73       105

   micro avg       0.79      0.83      0.81       410
   macro avg       0.80      0.84      0.81       410
weighted avg       0.79      0.83      0.81       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.728, eval_acc=0.971, eval_loss=4.24, eval_precision=0.704, eval_recall=0.763]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.90      0.89      1416
          NS       0.66      0.71      0.68      2857
          NT       0.53      0.63      0.58      1314

   micro avg       0.68      0.74      0.71      5587
   macro avg       0.69      0.75      0.72      5587
weighted avg       0.69      0.74      0.71      5587



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.93, train_acc=0.995, train_loss=1.34, train_precision=0.945, train_recall=0.921] 


train_reports:
              precision    recall  f1-score   support

          NR       0.95      0.93      0.94        83
          NS       0.97      0.91      0.94       222
          NT       0.89      0.91      0.90       105

   micro avg       0.94      0.92      0.93       410
   macro avg       0.94      0.92      0.93       410
weighted avg       0.94      0.92      0.93       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.734, eval_acc=0.967, eval_loss=4.82, eval_precision=0.695, eval_recall=0.789]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.89      0.90      1416
          NS       0.72      0.73      0.73      2857
          NT       0.51      0.76      0.61      1314

   micro avg       0.70      0.78      0.74      5587
   macro avg       0.71      0.79      0.75      5587
weighted avg       0.72      0.78      0.74      5587



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.43it/s, F1=0.931, train_acc=0.994, train_loss=1.33, train_precision=0.933, train_recall=0.931]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.98      0.99        83
          NS       0.93      0.91      0.92       222
          NT       0.88      0.93      0.91       105

   micro avg       0.93      0.93      0.93       410
   macro avg       0.94      0.94      0.94       410
weighted avg       0.93      0.93      0.93       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.76, eval_acc=0.973, eval_loss=4.16, eval_precision=0.733, eval_recall=0.801] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.70      0.81      0.75      2857
          NT       0.62      0.63      0.63      1314

   micro avg       0.73      0.79      0.76      5587
   macro avg       0.74      0.78      0.76      5587
weighted avg       0.73      0.79      0.76      5587



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.959, train_acc=0.998, train_loss=0.555, train_precision=0.955, train_recall=0.964]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.95      0.96        83
          NS       0.96      0.98      0.97       222
          NT       0.95      0.95      0.95       105

   micro avg       0.96      0.97      0.96       410
   macro avg       0.96      0.96      0.96       410
weighted avg       0.96      0.97      0.96       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.785, eval_acc=0.972, eval_loss=4.74, eval_precision=0.765, eval_recall=0.814]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.80      0.77      0.79      2857
          NT       0.56      0.75      0.64      1314

   micro avg       0.76      0.80      0.78      5587
   macro avg       0.76      0.81      0.78      5587
weighted avg       0.77      0.80      0.79      5587



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.37it/s, F1=0.979, train_acc=0.998, train_loss=0.42, train_precision=0.98, train_recall=0.979]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.96      0.98        83
          NS       0.97      0.98      0.98       222
          NT       0.98      0.99      0.99       105

   micro avg       0.98      0.98      0.98       410
   macro avg       0.98      0.98      0.98       410
weighted avg       0.98      0.98      0.98       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.805, eval_acc=0.976, eval_loss=4.29, eval_precision=0.799, eval_recall=0.815]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.81      0.80      0.81      2857
          NT       0.62      0.69      0.66      1314

   micro avg       0.79      0.81      0.80      5587
   macro avg       0.78      0.81      0.80      5587
weighted avg       0.79      0.81      0.80      5587



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.38it/s, F1=0.966, train_acc=0.998, train_loss=0.364, train_precision=0.967, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.98      0.99        83
          NS       1.00      1.00      1.00       222
          NT       0.99      1.00      1.00       105

   micro avg       1.00      0.99      1.00       410
   macro avg       1.00      0.99      0.99       410
weighted avg       1.00      0.99      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.794, eval_acc=0.975, eval_loss=4.48, eval_precision=0.783, eval_recall=0.812]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.93      0.92      1416
          NS       0.78      0.80      0.79      2857
          NT       0.62      0.68      0.65      1314

   micro avg       0.77      0.80      0.79      5587
   macro avg       0.77      0.80      0.79      5587
weighted avg       0.77      0.80      0.79      5587



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.993, train_acc=0.999, train_loss=0.205, train_precision=0.995, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.94      0.97        83
          NS       0.99      1.00      0.99       222
          NT       1.00      1.00      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       1.00      0.98      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.8, eval_acc=0.974, eval_loss=4.91, eval_precision=0.8, eval_recall=0.805]    


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.81      0.79      0.80      2857
          NT       0.61      0.68      0.64      1314

   micro avg       0.79      0.79      0.79      5587
   macro avg       0.78      0.79      0.79      5587
weighted avg       0.79      0.79      0.79      5587



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.961, train_acc=1, train_loss=0.126, train_precision=0.965, train_recall=0.958]    


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.96      0.98        83
          NS       1.00      1.00      1.00       222
          NT       0.99      0.99      0.99       105

   micro avg       1.00      0.99      0.99       410
   macro avg       1.00      0.98      0.99       410
weighted avg       1.00      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.802, eval_acc=0.976, eval_loss=4.51, eval_precision=0.791, eval_recall=0.818]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.92      0.92      1416
          NS       0.80      0.80      0.80      2857
          NT       0.63      0.71      0.66      1314

   micro avg       0.78      0.81      0.80      5587
   macro avg       0.78      0.81      0.79      5587
weighted avg       0.79      0.81      0.80      5587



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.30it/s, F1=1, train_acc=1, train_loss=0.0883, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.21it/s, F1=0.801, eval_acc=0.976, eval_loss=4.6, eval_precision=0.786, eval_recall=0.82]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.80      0.80      0.80      2857
          NT       0.62      0.72      0.67      1314

   micro avg       0.78      0.81      0.80      5587
   macro avg       0.78      0.81      0.79      5587
weighted avg       0.79      0.81      0.80      5587



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=0.969, train_acc=1, train_loss=0.0642, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.804, eval_acc=0.976, eval_loss=4.78, eval_precision=0.789, eval_recall=0.825]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.80      0.80      0.80      2857
          NT       0.62      0.73      0.67      1314

   micro avg       0.78      0.82      0.80      5587
   macro avg       0.78      0.82      0.80      5587
weighted avg       0.79      0.82      0.80      5587



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=1, train_acc=1, train_loss=0.0575, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.796, eval_acc=0.976, eval_loss=4.76, eval_precision=0.78, eval_recall=0.818] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.91      1416
          NS       0.77      0.81      0.79      2857
          NT       0.64      0.70      0.67      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.31it/s, F1=1, train_acc=1, train_loss=0.0466, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.23it/s, F1=0.802, eval_acc=0.976, eval_loss=4.84, eval_precision=0.786, eval_recall=0.824]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.91      1416
          NS       0.79      0.81      0.80      2857
          NT       0.63      0.72      0.67      1314

   micro avg       0.78      0.82      0.80      5587
   macro avg       0.78      0.82      0.80      5587
weighted avg       0.78      0.82      0.80      5587



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.998, train_acc=1, train_loss=0.0526, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.99      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.793, eval_acc=0.974, eval_loss=5.98, eval_precision=0.8, eval_recall=0.792]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.91      0.91      1416
          NS       0.78      0.81      0.80      2857
          NT       0.65      0.56      0.60      1314

   micro avg       0.79      0.78      0.78      5587
   macro avg       0.78      0.76      0.77      5587
weighted avg       0.78      0.78      0.78      5587



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.922, train_acc=0.997, train_loss=0.819, train_precision=0.918, train_recall=0.928]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99        83
          NS       0.98      0.98      0.98       222
          NT       0.90      0.91      0.91       105

   micro avg       0.96      0.97      0.96       410
   macro avg       0.95      0.96      0.96       410
weighted avg       0.96      0.97      0.96       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.28it/s, F1=0.758, eval_acc=0.97, eval_loss=5.81, eval_precision=0.724, eval_recall=0.806] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.93      0.91      1416
          NS       0.71      0.79      0.75      2857
          NT       0.56      0.65      0.60      1314

   micro avg       0.72      0.79      0.75      5587
   macro avg       0.72      0.79      0.75      5587
weighted avg       0.72      0.79      0.76      5587



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.986, train_acc=0.999, train_loss=0.314, train_precision=0.983, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       0.99      0.99      0.99       222
          NT       0.95      0.98      0.97       105

   micro avg       0.98      0.99      0.99       410
   macro avg       0.98      0.99      0.99       410
weighted avg       0.98      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.783, eval_acc=0.973, eval_loss=4.97, eval_precision=0.762, eval_recall=0.811]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.92      0.90      1416
          NS       0.77      0.79      0.78      2857
          NT       0.60      0.70      0.65      1314

   micro avg       0.76      0.80      0.78      5587
   macro avg       0.75      0.80      0.78      5587
weighted avg       0.76      0.80      0.78      5587



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.986, train_acc=0.999, train_loss=0.291, train_precision=0.98, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98        83
          NS       0.99      0.98      0.98       222
          NT       0.97      1.00      0.99       105

   micro avg       0.98      0.99      0.98       410
   macro avg       0.98      0.99      0.98       410
weighted avg       0.98      0.99      0.98       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.774, eval_acc=0.972, eval_loss=4.97, eval_precision=0.736, eval_recall=0.826]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.93      0.91      1416
          NS       0.73      0.81      0.77      2857
          NT       0.61      0.71      0.65      1314

   micro avg       0.74      0.82      0.77      5587
   macro avg       0.74      0.82      0.78      5587
weighted avg       0.74      0.82      0.78      5587



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=0.969, train_acc=0.997, train_loss=0.665, train_precision=0.965, train_recall=0.974]


train_reports:
              precision    recall  f1-score   support

          NR       0.94      0.96      0.95        83
          NS       0.95      0.98      0.97       222
          NT       0.94      0.96      0.95       105

   micro avg       0.95      0.97      0.96       410
   macro avg       0.95      0.97      0.96       410
weighted avg       0.95      0.97      0.96       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.797, eval_acc=0.974, eval_loss=4.68, eval_precision=0.785, eval_recall=0.813]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.93      0.91      1416
          NS       0.82      0.78      0.80      2857
          NT       0.60      0.74      0.67      1314

   micro avg       0.78      0.81      0.79      5587
   macro avg       0.77      0.82      0.79      5587
weighted avg       0.79      0.81      0.80      5587



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.44it/s, F1=0.969, train_acc=1, train_loss=0.0761, train_precision=0.969, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.57it/s, F1=0.8, eval_acc=0.975, eval_loss=4.74, eval_precision=0.784, eval_recall=0.821]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.94      0.92      1416
          NS       0.79      0.79      0.79      2857
          NT       0.62      0.73      0.67      1314

   micro avg       0.78      0.81      0.79      5587
   macro avg       0.77      0.82      0.79      5587
weighted avg       0.78      0.81      0.80      5587



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.999, train_acc=1, train_loss=0.102, train_precision=0.999, train_recall=0.999] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      0.99        83
          NS       1.00      1.00      1.00       222
          NT       0.99      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.794, eval_acc=0.975, eval_loss=4.95, eval_precision=0.781, eval_recall=0.813]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.94      0.90      1416
          NS       0.79      0.79      0.79      2857
          NT       0.65      0.69      0.67      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.77      0.81      0.79      5587



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=0.993, train_acc=0.999, train_loss=0.305, train_precision=0.992, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      1.00      0.98        83
          NS       1.00      1.00      1.00       222
          NT       0.99      0.98      0.99       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.795, eval_acc=0.975, eval_loss=5.26, eval_precision=0.783, eval_recall=0.813]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.90      0.91      1416
          NS       0.80      0.79      0.79      2857
          NT       0.61      0.74      0.66      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=0.998, train_acc=1, train_loss=0.0485, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.98      0.99      0.99       105

   micro avg       1.00      1.00      1.00       410
   macro avg       0.99      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.795, eval_acc=0.975, eval_loss=5.51, eval_precision=0.79, eval_recall=0.806] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.90      0.91      1416
          NS       0.80      0.79      0.79      2857
          NT       0.62      0.71      0.66      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.78      0.80      0.79      5587
weighted avg       0.78      0.80      0.79      5587



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.36it/s, F1=0.998, train_acc=1, train_loss=0.0488, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99        83
          NS       1.00      1.00      1.00       222
          NT       1.00      0.99      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.793, eval_acc=0.974, eval_loss=5.38, eval_precision=0.779, eval_recall=0.814]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.90      0.91      1416
          NS       0.79      0.79      0.79      2857
          NT       0.60      0.74      0.67      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=0.998, train_acc=1, train_loss=0.0374, train_precision=0.997, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       0.99      1.00      0.99       222
          NT       1.00      1.00      1.00       105

   micro avg       0.99      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       0.99      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.57it/s, F1=0.795, eval_acc=0.974, eval_loss=5.5, eval_precision=0.784, eval_recall=0.813] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.89      0.91      1416
          NS       0.81      0.80      0.80      2857
          NT       0.60      0.74      0.66      1314

   micro avg       0.78      0.81      0.79      5587
   macro avg       0.78      0.81      0.79      5587
weighted avg       0.79      0.81      0.80      5587



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.29it/s, F1=1, train_acc=1, train_loss=0.0239, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.795, eval_acc=0.975, eval_loss=5.61, eval_precision=0.785, eval_recall=0.811]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.89      0.91      1416
          NS       0.80      0.79      0.80      2857
          NT       0.60      0.73      0.66      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.77      0.80      0.79      5587
weighted avg       0.78      0.80      0.79      5587



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.999, train_acc=1, train_loss=0.0317, train_precision=0.998, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.99      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.795, eval_acc=0.974, eval_loss=5.93, eval_precision=0.789, eval_recall=0.807]


eval_reports:


calculate data/few_shot/msra/train_250.json etag: 100%|██████████| 161k/161k [00:00<00:00, 212MB/s]
calculate data/few_shot/msra/dev.json etag:   0%|          | 0.00/2.12M [00:00<?, ?B/s]

              precision    recall  f1-score   support

          NR       0.91      0.89      0.90      1416
          NS       0.79      0.80      0.79      2857
          NT       0.62      0.70      0.66      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.77      0.80      0.78      5587
weighted avg       0.78      0.80      0.79      5587

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_250.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_ta

calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 316MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 369MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 123kB/s]


load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree


count line size data/few_shot/msra/labels.txt: 14L [00:00, 124407.32L/s]
build line mapper: 14L [00:00, 108339.96L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4191.91it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 156234.82it/s]
load dataset from data/few_shot/msra/train_250.json: 44it [00:00, 423.20it/s]

load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_250.json: 250it [00:00, 382.31it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:09, 469.50it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.29it/s, F1=0.00226, train_acc=0.301, train_loss=113, train_precision=0.00117, train_recall=0.0355]  


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.01      0.00        83
          NS       0.00      0.06      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.03      0.00       410
   macro avg       0.00      0.02      0.00       410
weighted avg       0.00      0.03      0.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.41it/s, F1=0, eval_acc=0.897, eval_loss=26.7, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.31it/s, F1=0, train_acc=0.889, train_loss=32.2, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.00      0.00      0.00       410
weighted avg       0.00      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0, eval_acc=0.897, eval_loss=21.1, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.47it/s, F1=0, train_acc=0.893, train_loss=22.7, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.00      0.00      0.00       410
weighted avg       0.00      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.00233, eval_acc=0.9, eval_loss=14.3, eval_precision=0.00785, eval_recall=0.00162]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.01      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.00536, train_acc=0.911, train_loss=15, train_precision=0.00419, train_recall=0.00799]  


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.01      0.01      0.01       222
          NT       0.01      0.02      0.01       105

   micro avg       0.01      0.01      0.01       410
   macro avg       0.00      0.01      0.01       410
weighted avg       0.01      0.01      0.01       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.018, eval_acc=0.928, eval_loss=9.79, eval_precision=0.0141, eval_recall=0.0255] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.03      0.06      0.04      2857
          NT       0.00      0.01      0.01      1314

   micro avg       0.02      0.03      0.02      5587
   macro avg       0.01      0.02      0.01      5587
weighted avg       0.01      0.03      0.02      5587



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.34it/s, F1=0.236, train_acc=0.953, train_loss=8.8, train_precision=0.199, train_recall=0.307]    


train_reports:
              precision    recall  f1-score   support

          NR       0.43      0.51      0.47        83
          NS       0.11      0.21      0.15       222
          NT       0.14      0.32      0.20       105

   micro avg       0.16      0.30      0.21       410
   macro avg       0.23      0.35      0.27       410
weighted avg       0.19      0.30      0.22       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.548, eval_acc=0.962, eval_loss=6.12, eval_precision=0.499, eval_recall=0.624]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.73      0.79      0.76      1416
          NS       0.47      0.64      0.54      2857
          NT       0.22      0.33      0.26      1314

   micro avg       0.46      0.60      0.52      5587
   macro avg       0.47      0.59      0.52      5587
weighted avg       0.48      0.60      0.53      5587



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=0.77, train_acc=0.986, train_loss=3.28, train_precision=0.742, train_recall=0.811] 


train_reports:
              precision    recall  f1-score   support

          NR       0.75      0.83      0.79        83
          NS       0.76      0.82      0.79       222
          NT       0.63      0.74      0.68       105

   micro avg       0.72      0.80      0.76       410
   macro avg       0.71      0.80      0.75       410
weighted avg       0.72      0.80      0.76       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.716, eval_acc=0.969, eval_loss=5.28, eval_precision=0.668, eval_recall=0.779]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.81      0.88      0.85      1416
          NS       0.70      0.71      0.71      2857
          NT       0.47      0.72      0.57      1314

   micro avg       0.65      0.76      0.70      5587
   macro avg       0.66      0.77      0.71      5587
weighted avg       0.68      0.76      0.71      5587



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=0.862, train_acc=0.992, train_loss=1.72, train_precision=0.865, train_recall=0.862]


train_reports:
              precision    recall  f1-score   support

          NR       0.85      0.88      0.86        83
          NS       0.91      0.92      0.91       222
          NT       0.88      0.88      0.88       105

   micro avg       0.89      0.90      0.89       410
   macro avg       0.88      0.89      0.89       410
weighted avg       0.89      0.90      0.89       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.716, eval_acc=0.971, eval_loss=4.89, eval_precision=0.66, eval_recall=0.792] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.85      0.86      0.86      1416
          NS       0.67      0.78      0.72      2857
          NT       0.46      0.72      0.56      1314

   micro avg       0.65      0.79      0.71      5587
   macro avg       0.66      0.79      0.71      5587
weighted avg       0.67      0.79      0.72      5587



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.36it/s, F1=0.896, train_acc=0.993, train_loss=1.29, train_precision=0.887, train_recall=0.911]


train_reports:
              precision    recall  f1-score   support

          NR       0.95      0.95      0.95        83
          NS       0.92      0.94      0.93       222
          NT       0.86      0.91      0.89       105

   micro avg       0.91      0.94      0.92       410
   macro avg       0.91      0.94      0.92       410
weighted avg       0.91      0.94      0.92       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.40it/s, F1=0.759, eval_acc=0.972, eval_loss=5.42, eval_precision=0.734, eval_recall=0.792]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.88      0.88      1416
          NS       0.75      0.80      0.77      2857
          NT       0.54      0.67      0.59      1314

   micro avg       0.72      0.79      0.75      5587
   macro avg       0.72      0.78      0.75      5587
weighted avg       0.73      0.79      0.76      5587



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.43it/s, F1=0.941, train_acc=0.996, train_loss=1, train_precision=0.936, train_recall=0.949]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.96      0.98        83
          NS       0.95      0.96      0.96       222
          NT       0.85      0.93      0.89       105

   micro avg       0.93      0.95      0.94       410
   macro avg       0.93      0.95      0.94       410
weighted avg       0.93      0.95      0.94       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.782, eval_acc=0.974, eval_loss=5.24, eval_precision=0.779, eval_recall=0.792]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.92      0.90      1416
          NS       0.80      0.78      0.79      2857
          NT       0.57      0.63      0.60      1314

   micro avg       0.76      0.78      0.77      5587
   macro avg       0.75      0.78      0.76      5587
weighted avg       0.77      0.78      0.77      5587



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.969, train_acc=0.998, train_loss=0.522, train_precision=0.97, train_recall=0.969] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.95      0.98        83
          NS       0.98      0.98      0.98       222
          NT       0.94      0.96      0.95       105

   micro avg       0.97      0.97      0.97       410
   macro avg       0.97      0.96      0.97       410
weighted avg       0.97      0.97      0.97       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.778, eval_acc=0.972, eval_loss=5.56, eval_precision=0.749, eval_recall=0.818]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.92      0.90      1416
          NS       0.81      0.78      0.79      2857
          NT       0.55      0.74      0.63      1314

   micro avg       0.75      0.81      0.78      5587
   macro avg       0.74      0.82      0.77      5587
weighted avg       0.76      0.81      0.78      5587



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.37it/s, F1=0.989, train_acc=0.999, train_loss=0.303, train_precision=0.99, train_recall=0.989] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.96      0.97        83
          NS       0.98      0.99      0.99       222
          NT       1.00      0.99      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.98      0.98       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.28it/s, F1=0.779, eval_acc=0.972, eval_loss=6.07, eval_precision=0.746, eval_recall=0.822]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.93      0.90      1416
          NS       0.82      0.76      0.79      2857
          NT       0.55      0.79      0.65      1314

   micro avg       0.75      0.81      0.78      5587
   macro avg       0.75      0.83      0.78      5587
weighted avg       0.77      0.81      0.78      5587



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.32it/s, F1=0.983, train_acc=0.999, train_loss=0.203, train_precision=0.985, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.95      0.97        83
          NS       0.98      1.00      0.99       222
          NT       1.00      1.00      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.98      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.795, eval_acc=0.974, eval_loss=5.82, eval_precision=0.773, eval_recall=0.824]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.82      0.78      0.80      2857
          NT       0.58      0.78      0.67      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.83      0.79      5587
weighted avg       0.78      0.81      0.80      5587



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.35it/s, F1=0.963, train_acc=0.999, train_loss=0.233, train_precision=0.964, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.98      0.98        83
          NS       1.00      1.00      1.00       222
          NT       0.99      0.99      0.99       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.798, eval_acc=0.975, eval_loss=5.62, eval_precision=0.782, eval_recall=0.819]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.92      0.90      1416
          NS       0.82      0.79      0.80      2857
          NT       0.59      0.73      0.65      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.76      0.81      0.78      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.50it/s, F1=0.985, train_acc=0.999, train_loss=0.198, train_precision=0.986, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       0.99      0.98      0.98       222
          NT       0.99      1.00      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.782, eval_acc=0.974, eval_loss=5.64, eval_precision=0.741, eval_recall=0.834]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.92      0.89      1416
          NS       0.76      0.80      0.78      2857
          NT       0.57      0.76      0.65      1314

   micro avg       0.73      0.82      0.77      5587
   macro avg       0.73      0.83      0.77      5587
weighted avg       0.74      0.82      0.78      5587



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.37it/s, F1=0.993, train_acc=1, train_loss=0.125, train_precision=0.992, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99        83
          NS       1.00      1.00      1.00       222
          NT       0.98      0.99      0.99       105

   micro avg       0.99      1.00      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      1.00      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.789, eval_acc=0.974, eval_loss=5.77, eval_precision=0.761, eval_recall=0.825]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.86      0.92      0.89      1416
          NS       0.79      0.79      0.79      2857
          NT       0.57      0.75      0.65      1314

   micro avg       0.75      0.81      0.78      5587
   macro avg       0.74      0.82      0.78      5587
weighted avg       0.76      0.81      0.78      5587



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.38it/s, F1=1, train_acc=1, train_loss=0.0699, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.793, eval_acc=0.974, eval_loss=5.92, eval_precision=0.764, eval_recall=0.831]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.93      0.90      1416
          NS       0.80      0.80      0.80      2857
          NT       0.57      0.76      0.65      1314

   micro avg       0.75      0.82      0.79      5587
   macro avg       0.75      0.83      0.78      5587
weighted avg       0.77      0.82      0.79      5587



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.36it/s, F1=0.999, train_acc=1, train_loss=0.0804, train_precision=1, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      0.99        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.794, eval_acc=0.974, eval_loss=6.09, eval_precision=0.763, eval_recall=0.834]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.93      0.91      1416
          NS       0.80      0.80      0.80      2857
          NT       0.57      0.77      0.66      1314

   micro avg       0.76      0.82      0.79      5587
   macro avg       0.75      0.83      0.79      5587
weighted avg       0.77      0.82      0.79      5587



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=0.966, train_acc=1, train_loss=0.0589, train_precision=0.964, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       0.99      1.00      0.99       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.795, eval_acc=0.975, eval_loss=5.92, eval_precision=0.766, eval_recall=0.831]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.93      0.91      1416
          NS       0.80      0.80      0.80      2857
          NT       0.58      0.75      0.66      1314

   micro avg       0.76      0.82      0.79      5587
   macro avg       0.76      0.83      0.79      5587
weighted avg       0.77      0.82      0.79      5587



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:12<00:00,  2.52it/s, F1=0.999, train_acc=1, train_loss=0.0496, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.805, eval_acc=0.976, eval_loss=6.16, eval_precision=0.796, eval_recall=0.821]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.82      0.79      0.81      2857
          NT       0.60      0.72      0.65      1314

   micro avg       0.78      0.81      0.80      5587
   macro avg       0.78      0.81      0.79      5587
weighted avg       0.79      0.81      0.80      5587



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.45it/s, F1=1, train_acc=1, train_loss=0.0309, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.806, eval_acc=0.975, eval_loss=6.31, eval_precision=0.789, eval_recall=0.829]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.83      0.79      0.81      2857
          NT       0.60      0.75      0.67      1314

   micro avg       0.78      0.82      0.80      5587
   macro avg       0.78      0.82      0.80      5587
weighted avg       0.79      0.82      0.80      5587



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.46it/s, F1=0.998, train_acc=1, train_loss=0.0432, train_precision=0.996, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.797, eval_acc=0.976, eval_loss=6.72, eval_precision=0.809, eval_recall=0.793]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.91      1416
          NS       0.84      0.77      0.80      2857
          NT       0.60      0.69      0.64      1314

   micro avg       0.79      0.79      0.79      5587
   macro avg       0.78      0.79      0.79      5587
weighted avg       0.80      0.79      0.79      5587



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.989, train_acc=1, train_loss=0.111, train_precision=0.986, train_recall=0.993]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.96      0.99      0.98       105

   micro avg       0.99      1.00      0.99       410
   macro avg       0.99      1.00      0.99       410
weighted avg       0.99      1.00      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.771, eval_acc=0.975, eval_loss=5.55, eval_precision=0.739, eval_recall=0.815]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.93      0.91      1416
          NS       0.75      0.80      0.78      2857
          NT       0.50      0.67      0.57      1314

   micro avg       0.71      0.80      0.76      5587
   macro avg       0.72      0.80      0.75      5587
weighted avg       0.73      0.80      0.76      5587



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=1, train_acc=1, train_loss=0.0543, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.794, eval_acc=0.975, eval_loss=6.22, eval_precision=0.769, eval_recall=0.827]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.94      0.92      1416
          NS       0.80      0.79      0.79      2857
          NT       0.58      0.75      0.66      1314

   micro avg       0.76      0.82      0.79      5587
   macro avg       0.76      0.83      0.79      5587
weighted avg       0.77      0.82      0.79      5587



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.31it/s, F1=1, train_acc=1, train_loss=0.0264, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.794, eval_acc=0.974, eval_loss=6.47, eval_precision=0.766, eval_recall=0.832]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.93      0.92      1416
          NS       0.81      0.79      0.80      2857
          NT       0.57      0.77      0.66      1314

   micro avg       0.76      0.82      0.79      5587
   macro avg       0.76      0.83      0.79      5587
weighted avg       0.78      0.82      0.80      5587



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.33it/s, F1=1, train_acc=1, train_loss=0.019, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.795, eval_acc=0.974, eval_loss=6.47, eval_precision=0.767, eval_recall=0.832]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.93      0.92      1416
          NS       0.81      0.79      0.80      2857
          NT       0.57      0.77      0.66      1314

   micro avg       0.76      0.82      0.79      5587
   macro avg       0.76      0.83      0.79      5587
weighted avg       0.78      0.82      0.80      5587



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.43it/s, F1=0.999, train_acc=1, train_loss=0.0206, train_precision=0.998, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.797, eval_acc=0.975, eval_loss=6.47, eval_precision=0.777, eval_recall=0.825]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.81      0.79      0.80      2857
          NT       0.58      0.75      0.66      1314

   micro avg       0.77      0.82      0.79      5587
   macro avg       0.77      0.82      0.79      5587
weighted avg       0.78      0.82      0.80      5587



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.35it/s, F1=1, train_acc=1, train_loss=0.0195, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.8, eval_acc=0.975, eval_loss=6.53, eval_precision=0.785, eval_recall=0.823]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.81      0.79      0.80      2857
          NT       0.59      0.74      0.65      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.82      0.79      5587
weighted avg       0.78      0.81      0.80      5587



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.47it/s, F1=1, train_acc=1, train_loss=0.0155, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.8, eval_acc=0.975, eval_loss=6.51, eval_precision=0.78, eval_recall=0.827]   


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.92      0.92      1416
          NS       0.81      0.80      0.80      2857
          NT       0.58      0.75      0.66      1314

   micro avg       0.77      0.82      0.79      5587
   macro avg       0.77      0.82      0.79      5587
weighted avg       0.78      0.82      0.80      5587



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.46it/s, F1=0.988, train_acc=0.999, train_loss=0.292, train_precision=0.985, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

          NR       0.97      1.00      0.98        83
          NS       1.00      1.00      1.00       222
          NT       0.97      0.97      0.97       105

   micro avg       0.98      0.99      0.99       410
   macro avg       0.98      0.99      0.98       410
weighted avg       0.98      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.794, eval_acc=0.975, eval_loss=6.24, eval_precision=0.775, eval_recall=0.819]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.91      0.91      1416
          NS       0.80      0.80      0.80      2857
          NT       0.59      0.74      0.66      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.76      0.82      0.79      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.35it/s, F1=0.996, train_acc=0.999, train_loss=0.173, train_precision=0.997, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99        83
          NS       1.00      1.00      1.00       222
          NT       0.99      0.98      0.99       105

   micro avg       1.00      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       1.00      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.797, eval_acc=0.975, eval_loss=6.47, eval_precision=0.789, eval_recall=0.812]


eval_reports:
              precision    recall  f1-score   support

          NR       0.89      0.93      0.91      1416
          NS       0.83      0.77      0.80      2857
          NT       0.59      0.73      0.65      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.79      0.80      0.79      5587



calculate data/few_shot/msra/train_250.json etag: 100%|██████████| 161k/161k [00:00<00:00, 180MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 328MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 369MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 284kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_250.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_250_x3"
}
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 114912.44L/s]
build line mapper: 14L [00:00, 25608.48L/s]4 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4097.72it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 161798.08it/s]
load dataset from data/few_shot/msra/train_250.json: 59it [00:00, 586.71it/s]

load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/55046d54bc5d0cbdb156a3a356c4d7f9_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_250.json: 250it [00:00, 551.57it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 663.38it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.32it/s, F1=0.00144, train_acc=0.306, train_loss=140, train_precision=0.000761, train_recall=0.0177] 


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.02      0.00       222
          NT       0.00      0.01      0.00       105

   micro avg       0.00      0.01      0.00       410
   macro avg       0.00      0.01      0.00       410
weighted avg       0.00      0.01      0.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0, eval_acc=0.894, eval_loss=39.2, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=0, train_acc=0.888, train_loss=36.9, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.00      0.00      0.00       410
weighted avg       0.00      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0, eval_acc=0.897, eval_loss=24.3, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.36it/s, F1=0, train_acc=0.89, train_loss=27.4, train_precision=0, train_recall=0] 


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00        83
          NS       0.00      0.00      0.00       222
          NT       0.00      0.00      0.00       105

   micro avg       0.00      0.00      0.00       410
   macro avg       0.00      0.00      0.00       410
weighted avg       0.00      0.00      0.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.00277, eval_acc=0.898, eval_loss=16.1, eval_precision=0.014, eval_recall=0.00167]    


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.01      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.01      0.00      0.00      5587
   macro avg       0.01      0.00      0.00      5587
weighted avg       0.01      0.00      0.00      5587



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.44it/s, F1=0.0281, train_acc=0.918, train_loss=15.6, train_precision=0.0232, train_recall=0.0379]   


train_reports:
              precision    recall  f1-score   support

          NR       0.10      0.01      0.02        83
          NS       0.01      0.02      0.01       222
          NT       0.05      0.10      0.06       105

   micro avg       0.02      0.04      0.03       410
   macro avg       0.05      0.04      0.03       410
weighted avg       0.04      0.04      0.03       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.0603, eval_acc=0.926, eval_loss=10.2, eval_precision=0.0434, eval_recall=0.101] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.10      0.14      0.12      1416
          NS       0.04      0.12      0.06      2857
          NT       0.02      0.06      0.03      1314

   micro avg       0.04      0.11      0.06      5587
   macro avg       0.06      0.10      0.07      5587
weighted avg       0.05      0.11      0.07      5587



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.44it/s, F1=0.243, train_acc=0.948, train_loss=9.32, train_precision=0.197, train_recall=0.327]  


train_reports:
              precision    recall  f1-score   support

          NR       0.25      0.40      0.31        83
          NS       0.17      0.31      0.22       222
          NT       0.13      0.30      0.18       105

   micro avg       0.17      0.32      0.22       410
   macro avg       0.18      0.33      0.24       410
weighted avg       0.18      0.32      0.23       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.397, eval_acc=0.955, eval_loss=6.12, eval_precision=0.333, eval_recall=0.504]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.17      0.29      0.22      1416
          NS       0.39      0.56      0.46      2857
          NT       0.31      0.54      0.39      1314

   micro avg       0.31      0.49      0.38      5587
   macro avg       0.29      0.46      0.36      5587
weighted avg       0.32      0.49      0.38      5587



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=0.541, train_acc=0.977, train_loss=4.37, train_precision=0.495, train_recall=0.61] 


train_reports:
              precision    recall  f1-score   support

          NR       0.58      0.75      0.65        83
          NS       0.44      0.59      0.50       222
          NT       0.44      0.69      0.54       105

   micro avg       0.46      0.65      0.54       410
   macro avg       0.49      0.67      0.56       410
weighted avg       0.47      0.65      0.54       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.55it/s, F1=0.694, eval_acc=0.972, eval_loss=4.79, eval_precision=0.673, eval_recall=0.723]


eval_reports:
              precision    recall  f1-score   support

          NR       0.85      0.88      0.86      1416
          NS       0.65      0.65      0.65      2857
          NT       0.50      0.66      0.57      1314

   micro avg       0.65      0.71      0.68      5587
   macro avg       0.66      0.73      0.69      5587
weighted avg       0.66      0.71      0.68      5587



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.37it/s, F1=0.814, train_acc=0.991, train_loss=2.16, train_precision=0.793, train_recall=0.843]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.96      0.98        83
          NS       0.77      0.82      0.79       222
          NT       0.71      0.85      0.77       105

   micro avg       0.79      0.85      0.82       410
   macro avg       0.83      0.88      0.85       410
weighted avg       0.80      0.85      0.82       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.749, eval_acc=0.974, eval_loss=4.65, eval_precision=0.734, eval_recall=0.771]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.91      0.90      1416
          NS       0.73      0.73      0.73      2857
          NT       0.55      0.66      0.60      1314

   micro avg       0.72      0.76      0.74      5587
   macro avg       0.72      0.77      0.74      5587
weighted avg       0.73      0.76      0.74      5587



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.28it/s, F1=0.956, train_acc=0.997, train_loss=0.937, train_precision=0.957, train_recall=0.957]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.96      0.98        83
          NS       0.96      0.97      0.96       222
          NT       0.92      0.92      0.92       105

   micro avg       0.95      0.96      0.95       410
   macro avg       0.95      0.95      0.95       410
weighted avg       0.95      0.96      0.95       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.769, eval_acc=0.975, eval_loss=4.62, eval_precision=0.746, eval_recall=0.8]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.91      0.91      1416
          NS       0.74      0.80      0.77      2857
          NT       0.56      0.64      0.60      1314

   micro avg       0.73      0.79      0.76      5587
   macro avg       0.74      0.78      0.76      5587
weighted avg       0.74      0.79      0.76      5587



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.37it/s, F1=0.944, train_acc=0.998, train_loss=0.511, train_precision=0.942, train_recall=0.946]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.98      0.98        83
          NS       0.98      0.98      0.98       222
          NT       0.94      0.97      0.96       105

   micro avg       0.97      0.98      0.98       410
   macro avg       0.97      0.98      0.97       410
weighted avg       0.97      0.98      0.98       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.771, eval_acc=0.975, eval_loss=4.87, eval_precision=0.748, eval_recall=0.802]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.91      0.90      1416
          NS       0.74      0.81      0.77      2857
          NT       0.57      0.61      0.59      1314

   micro avg       0.74      0.79      0.76      5587
   macro avg       0.73      0.78      0.76      5587
weighted avg       0.74      0.79      0.76      5587



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=0.964, train_acc=0.999, train_loss=0.35, train_precision=0.965, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      0.99        83
          NS       1.00      1.00      1.00       222
          NT       0.99      0.99      0.99       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      0.99      0.99       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.773, eval_acc=0.974, eval_loss=5.38, eval_precision=0.752, eval_recall=0.802]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.79      0.77      0.78      2857
          NT       0.55      0.71      0.62      1314

   micro avg       0.75      0.79      0.77      5587
   macro avg       0.75      0.80      0.77      5587
weighted avg       0.76      0.79      0.77      5587



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.943, train_acc=0.998, train_loss=0.329, train_precision=0.944, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.96      0.98        83
          NS       0.98      0.99      0.99       222
          NT       0.93      0.97      0.95       105

   micro avg       0.97      0.98      0.98       410
   macro avg       0.97      0.98      0.97       410
weighted avg       0.97      0.98      0.98       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.59it/s, F1=0.789, eval_acc=0.975, eval_loss=5.49, eval_precision=0.783, eval_recall=0.8]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.79      0.80      0.79      2857
          NT       0.58      0.62      0.60      1314

   micro avg       0.77      0.79      0.78      5587
   macro avg       0.76      0.78      0.77      5587
weighted avg       0.77      0.79      0.78      5587



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.32it/s, F1=0.955, train_acc=0.999, train_loss=0.25, train_precision=0.954, train_recall=0.957] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      0.99        83
          NS       1.00      1.00      1.00       222
          NT       0.95      0.97      0.96       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.98      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.789, eval_acc=0.976, eval_loss=5.33, eval_precision=0.767, eval_recall=0.818]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.79      0.80      0.80      2857
          NT       0.59      0.69      0.64      1314

   micro avg       0.76      0.81      0.78      5587
   macro avg       0.76      0.81      0.78      5587
weighted avg       0.77      0.81      0.79      5587



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=1, train_acc=1, train_loss=0.14, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.791, eval_acc=0.976, eval_loss=5.29, eval_precision=0.767, eval_recall=0.823]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.92      0.92      1416
          NS       0.79      0.80      0.80      2857
          NT       0.58      0.72      0.64      1314

   micro avg       0.76      0.81      0.79      5587
   macro avg       0.76      0.81      0.79      5587
weighted avg       0.77      0.81      0.79      5587



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.36it/s, F1=0.991, train_acc=1, train_loss=0.163, train_precision=0.99, train_recall=0.991]     


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99        83
          NS       0.99      0.99      0.99       222
          NT       0.99      1.00      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.793, eval_acc=0.976, eval_loss=5.39, eval_precision=0.771, eval_recall=0.823]


eval_reports:
              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.78      0.83      0.80      2857
          NT       0.60      0.66      0.63      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.76      0.80      0.78      5587
weighted avg       0.77      0.81      0.79      5587



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.99, train_acc=0.999, train_loss=0.138, train_precision=0.99, train_recall=0.99]   


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.98      0.97        83
          NS       1.00      1.00      1.00       222
          NT       0.98      0.99      0.99       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.98      0.99      0.98       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.21it/s, F1=0.776, eval_acc=0.974, eval_loss=5.89, eval_precision=0.752, eval_recall=0.807]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.84      0.95      0.89      1416
          NS       0.79      0.78      0.79      2857
          NT       0.59      0.70      0.64      1314

   micro avg       0.75      0.80      0.78      5587
   macro avg       0.74      0.81      0.77      5587
weighted avg       0.76      0.80      0.78      5587



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.46it/s, F1=0.985, train_acc=0.999, train_loss=0.197, train_precision=0.983, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      1.00      0.99        83
          NS       0.98      0.99      0.99       222
          NT       0.98      0.97      0.98       105

   micro avg       0.98      0.99      0.98       410
   macro avg       0.98      0.99      0.98       410
weighted avg       0.98      0.99      0.98       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.52it/s, F1=0.782, eval_acc=0.976, eval_loss=4.93, eval_precision=0.733, eval_recall=0.845]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.73      0.84      0.78      2857
          NT       0.59      0.74      0.66      1314

   micro avg       0.73      0.84      0.78      5587
   macro avg       0.74      0.84      0.78      5587
weighted avg       0.74      0.84      0.79      5587



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.44it/s, F1=0.995, train_acc=1, train_loss=0.209, train_precision=0.991, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      0.99        83
          NS       0.99      1.00      0.99       222
          NT       1.00      1.00      1.00       105

   micro avg       0.99      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       0.99      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.796, eval_acc=0.976, eval_loss=5.79, eval_precision=0.78, eval_recall=0.818] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.77      0.81      0.79      2857
          NT       0.61      0.67      0.64      1314

   micro avg       0.76      0.81      0.78      5587
   macro avg       0.76      0.80      0.78      5587
weighted avg       0.77      0.81      0.79      5587



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.986, train_acc=0.999, train_loss=0.215, train_precision=0.983, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98        83
          NS       0.99      1.00      0.99       222
          NT       0.98      0.98      0.98       105

   micro avg       0.98      0.99      0.99       410
   macro avg       0.98      0.99      0.98       410
weighted avg       0.98      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.77, eval_acc=0.976, eval_loss=5.54, eval_precision=0.739, eval_recall=0.808] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.92      0.90      1416
          NS       0.70      0.84      0.76      2857
          NT       0.60      0.57      0.59      1314

   micro avg       0.72      0.80      0.76      5587
   macro avg       0.73      0.78      0.75      5587
weighted avg       0.72      0.80      0.76      5587



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.49it/s, F1=0.993, train_acc=0.999, train_loss=0.355, train_precision=0.992, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      0.99        83
          NS       0.98      0.99      0.99       222
          NT       0.99      1.00      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.739, eval_acc=0.969, eval_loss=6.33, eval_precision=0.664, eval_recall=0.849]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.95      0.91      1416
          NS       0.68      0.83      0.75      2857
          NT       0.55      0.78      0.64      1314

   micro avg       0.69      0.85      0.76      5587
   macro avg       0.70      0.85      0.77      5587
weighted avg       0.70      0.85      0.76      5587



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.942, train_acc=0.992, train_loss=1.93, train_precision=0.922, train_recall=0.965] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      1.00      0.99        83
          NS       0.91      0.96      0.94       222
          NT       0.87      0.94      0.90       105

   micro avg       0.91      0.97      0.94       410
   macro avg       0.92      0.97      0.94       410
weighted avg       0.91      0.97      0.94       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.711, eval_acc=0.962, eval_loss=6.78, eval_precision=0.629, eval_recall=0.836]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.95      0.92      1416
          NS       0.68      0.78      0.73      2857
          NT       0.43      0.81      0.56      1314

   micro avg       0.64      0.83      0.72      5587
   macro avg       0.67      0.85      0.74      5587
weighted avg       0.68      0.83      0.74      5587



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.42it/s, F1=0.929, train_acc=0.995, train_loss=1.04, train_precision=0.907, train_recall=0.957] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       0.93      0.99      0.96       222
          NT       0.79      0.88      0.83       105

   micro avg       0.91      0.96      0.93       410
   macro avg       0.91      0.95      0.93       410
weighted avg       0.91      0.96      0.93       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.767, eval_acc=0.972, eval_loss=5.98, eval_precision=0.732, eval_recall=0.812]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.94      0.91      1416
          NS       0.79      0.77      0.78      2857
          NT       0.53      0.75      0.62      1314

   micro avg       0.73      0.81      0.77      5587
   macro avg       0.73      0.82      0.77      5587
weighted avg       0.75      0.81      0.77      5587



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.41it/s, F1=0.97, train_acc=0.998, train_loss=0.419, train_precision=0.961, train_recall=0.98]  


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99        83
          NS       0.97      0.99      0.98       222
          NT       0.88      0.94      0.91       105

   micro avg       0.95      0.98      0.97       410
   macro avg       0.95      0.97      0.96       410
weighted avg       0.95      0.98      0.97       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.784, eval_acc=0.974, eval_loss=6.33, eval_precision=0.767, eval_recall=0.809]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.92      0.91      1416
          NS       0.77      0.80      0.78      2857
          NT       0.58      0.65      0.61      1314

   micro avg       0.76      0.79      0.77      5587
   macro avg       0.75      0.79      0.77      5587
weighted avg       0.76      0.79      0.78      5587



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.29it/s, F1=0.965, train_acc=1, train_loss=0.0991, train_precision=0.964, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.98      0.98      0.98       105

   micro avg       0.99      1.00      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      1.00      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.779, eval_acc=0.974, eval_loss=6.1, eval_precision=0.751, eval_recall=0.816] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.78      0.79      0.78      2857
          NT       0.57      0.72      0.64      1314

   micro avg       0.75      0.81      0.78      5587
   macro avg       0.75      0.81      0.78      5587
weighted avg       0.76      0.81      0.78      5587



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=0.993, train_acc=1, train_loss=0.0752, train_precision=0.993, train_recall=0.993]    


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       0.98      0.98      0.98       222
          NT       1.00      1.00      1.00       105

   micro avg       0.99      0.99      0.99       410
   macro avg       0.99      0.99      0.99       410
weighted avg       0.99      0.99      0.99       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.781, eval_acc=0.974, eval_loss=6.13, eval_precision=0.752, eval_recall=0.819]


eval_reports:
              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.78      0.79      0.78      2857
          NT       0.57      0.74      0.64      1314

   micro avg       0.75      0.81      0.78      5587
   macro avg       0.76      0.82      0.78      5587
weighted avg       0.77      0.81      0.79      5587



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.37it/s, F1=0.968, train_acc=1, train_loss=0.0506, train_precision=0.967, train_recall=0.969]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.786, eval_acc=0.974, eval_loss=6.65, eval_precision=0.777, eval_recall=0.801]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.82      0.77      0.79      2857
          NT       0.59      0.72      0.65      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.77      0.80      0.79      5587
weighted avg       0.79      0.80      0.79      5587



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.999, train_acc=1, train_loss=0.0433, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.792, eval_acc=0.975, eval_loss=6.38, eval_precision=0.778, eval_recall=0.813]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.81      0.79      0.80      2857
          NT       0.60      0.72      0.65      1314

   micro avg       0.78      0.81      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.39it/s, F1=1, train_acc=1, train_loss=0.0291, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.792, eval_acc=0.975, eval_loss=6.45, eval_precision=0.778, eval_recall=0.814]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.80      0.79      0.80      2857
          NT       0.60      0.71      0.65      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.78      0.81      0.79      5587



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.40it/s, F1=0.999, train_acc=1, train_loss=0.0391, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.99      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.796, eval_acc=0.975, eval_loss=6.82, eval_precision=0.787, eval_recall=0.811]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.80      0.80      0.80      2857
          NT       0.61      0.68      0.64      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.77      0.80      0.79      5587
weighted avg       0.78      0.80      0.79      5587



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.35it/s, F1=1, train_acc=1, train_loss=0.0253, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       1.00      1.00      1.00       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.794, eval_acc=0.975, eval_loss=6.75, eval_precision=0.783, eval_recall=0.812]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.80      0.79      0.80      2857
          NT       0.61      0.69      0.65      1314

   micro avg       0.78      0.80      0.79      5587
   macro avg       0.77      0.81      0.79      5587
weighted avg       0.78      0.80      0.79      5587



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:09<00:00,  3.46it/s, F1=0.999, train_acc=1, train_loss=0.0333, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00        83
          NS       1.00      1.00      1.00       222
          NT       0.99      0.99      0.99       105

   micro avg       1.00      1.00      1.00       410
   macro avg       1.00      1.00      1.00       410
weighted avg       1.00      1.00      1.00       410



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.39it/s, F1=0.792, eval_acc=0.975, eval_loss=6.43, eval_precision=0.773, eval_recall=0.818]


eval_reports:
              precision    recall  f1-score   support

          NR       0.91      0.93      0.92      1416
          NS       0.79      0.79      0.79      2857
          NT       0.61      0.73      0.66      1314

   micro avg       0.77      0.81      0.79      5587
   macro avg       0.77      0.82      0.79      5587
weighted avg       0.78      0.81      0.79      5587



calculate data/few_shot/msra/train_500.json etag: 100%|██████████| 314k/314k [00:00<00:00, 17.9MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 329MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 369MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 123kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_500.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_500_x1"
}
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 86100.08L/s]
build line mapper: 14L [00:00, 119350.11L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4150.72it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 152307.13it/s]

load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding



load dataset from data/few_shot/msra/train_500.json: 500it [00:01, 392.61it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:09, 466.78it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model fro

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.37it/s, F1=0.001, train_acc=0.645, train_loss=73.3, train_precision=0.000528, train_recall=0.0105]  


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00       177
          NS       0.00      0.02      0.01       456
          NT       0.00      0.00      0.00       225

   micro avg       0.00      0.01      0.00       858
   macro avg       0.00      0.01      0.00       858
weighted avg       0.00      0.01      0.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0, eval_acc=0.897, eval_loss=23.7, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.44it/s, F1=0.0262, train_acc=0.899, train_loss=21.2, train_precision=0.0209, train_recall=0.0359]   


train_reports:
              precision    recall  f1-score   support

          NR       0.08      0.04      0.05       177
          NS       0.07      0.08      0.07       456
          NT       0.00      0.00      0.00       225

   micro avg       0.05      0.05      0.05       858
   macro avg       0.05      0.04      0.04       858
weighted avg       0.05      0.05      0.05       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.22, eval_acc=0.947, eval_loss=8.55, eval_precision=0.18, eval_recall=0.289]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.70      0.71      0.71      1416
          NS       0.11      0.18      0.14      2857
          NT       0.02      0.06      0.03      1314

   micro avg       0.17      0.29      0.21      5587
   macro avg       0.28      0.32      0.29      5587
weighted avg       0.24      0.29      0.26      5587



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.36it/s, F1=0.464, train_acc=0.96, train_loss=7.42, train_precision=0.415, train_recall=0.539] 


train_reports:
              precision    recall  f1-score   support

          NR       0.72      0.78      0.75       177
          NS       0.45      0.55      0.49       456
          NT       0.16      0.31      0.21       225

   micro avg       0.38      0.54      0.45       858
   macro avg       0.44      0.55      0.48       858
weighted avg       0.43      0.54      0.47       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.661, eval_acc=0.973, eval_loss=3.95, eval_precision=0.625, eval_recall=0.713]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.86      0.88      0.87      1416
          NS       0.76      0.73      0.74      2857
          NT       0.24      0.44      0.31      1314

   micro avg       0.59      0.70      0.64      5587
   macro avg       0.62      0.68      0.64      5587
weighted avg       0.66      0.70      0.67      5587



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.806, train_acc=0.987, train_loss=2.63, train_precision=0.786, train_recall=0.832]


train_reports:
              precision    recall  f1-score   support

          NR       0.91      0.90      0.91       177
          NS       0.84      0.83      0.84       456
          NT       0.59      0.77      0.67       225

   micro avg       0.78      0.83      0.80       858
   macro avg       0.78      0.84      0.81       858
weighted avg       0.79      0.83      0.81       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.79, eval_acc=0.979, eval_loss=4.04, eval_precision=0.778, eval_recall=0.808] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.94      1416
          NS       0.79      0.83      0.81      2857
          NT       0.51      0.58      0.55      1314

   micro avg       0.76      0.80      0.78      5587
   macro avg       0.75      0.78      0.76      5587
weighted avg       0.76      0.80      0.78      5587



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.47it/s, F1=0.918, train_acc=0.995, train_loss=1.11, train_precision=0.914, train_recall=0.925]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.95      0.96       177
          NS       0.95      0.95      0.95       456
          NT       0.83      0.86      0.84       225

   micro avg       0.92      0.93      0.92       858
   macro avg       0.91      0.92      0.92       858
weighted avg       0.92      0.93      0.92       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.816, eval_acc=0.982, eval_loss=3.45, eval_precision=0.79, eval_recall=0.849] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.95      0.95      1416
          NS       0.81      0.84      0.82      2857
          NT       0.59      0.74      0.66      1314

   micro avg       0.78      0.85      0.81      5587
   macro avg       0.79      0.84      0.81      5587
weighted avg       0.79      0.85      0.82      5587



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.35it/s, F1=0.942, train_acc=0.997, train_loss=0.672, train_precision=0.935, train_recall=0.952]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.97      0.99       177
          NS       0.94      0.96      0.95       456
          NT       0.88      0.93      0.90       225

   micro avg       0.94      0.96      0.95       858
   macro avg       0.94      0.96      0.95       858
weighted avg       0.94      0.96      0.95       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.822, eval_acc=0.981, eval_loss=3.89, eval_precision=0.798, eval_recall=0.852]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.95      0.93      1416
          NS       0.83      0.84      0.83      2857
          NT       0.63      0.77      0.70      1314

   micro avg       0.80      0.85      0.82      5587
   macro avg       0.79      0.85      0.82      5587
weighted avg       0.80      0.85      0.83      5587



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.967, train_acc=0.998, train_loss=0.486, train_precision=0.964, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.98      0.96      0.97       456
          NT       0.92      0.97      0.95       225

   micro avg       0.97      0.97      0.97       858
   macro avg       0.96      0.97      0.97       858
weighted avg       0.97      0.97      0.97       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.836, eval_acc=0.982, eval_loss=4.16, eval_precision=0.829, eval_recall=0.847]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.86      0.86      0.86      2857
          NT       0.64      0.71      0.67      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.81      0.84      0.83      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.47it/s, F1=0.975, train_acc=0.998, train_loss=0.356, train_precision=0.971, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.97      0.97       177
          NS       0.98      0.99      0.98       456
          NT       0.96      0.97      0.96       225

   micro avg       0.97      0.98      0.98       858
   macro avg       0.97      0.98      0.97       858
weighted avg       0.97      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.51it/s, F1=0.845, eval_acc=0.983, eval_loss=4.09, eval_precision=0.826, eval_recall=0.869]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.83      0.89      0.86      2857
          NT       0.69      0.74      0.72      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.40it/s, F1=0.987, train_acc=0.999, train_loss=0.276, train_precision=0.984, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      0.99      0.99       456
          NT       0.96      0.98      0.97       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.82, eval_acc=0.98, eval_loss=4.27, eval_precision=0.784, eval_recall=0.865]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.82      0.85      0.83      2857
          NT       0.61      0.81      0.69      1314

   micro avg       0.79      0.86      0.83      5587
   macro avg       0.79      0.87      0.83      5587
weighted avg       0.80      0.86      0.83      5587



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.39it/s, F1=0.982, train_acc=0.999, train_loss=0.25, train_precision=0.977, train_recall=0.988] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       0.98      0.98      0.98       456
          NT       0.97      0.98      0.97       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.831, eval_acc=0.981, eval_loss=5.59, eval_precision=0.842, eval_recall=0.825]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.97      0.95      0.96      1416
          NS       0.84      0.86      0.85      2857
          NT       0.68      0.61      0.64      1314

   micro avg       0.84      0.82      0.83      5587
   macro avg       0.83      0.80      0.82      5587
weighted avg       0.83      0.82      0.83      5587



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.45it/s, F1=0.981, train_acc=0.998, train_loss=0.365, train_precision=0.979, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.98      0.99      0.99       456
          NT       0.96      0.96      0.96       225

   micro avg       0.98      0.98      0.98       858
   macro avg       0.98      0.98      0.98       858
weighted avg       0.98      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.48it/s, F1=0.817, eval_acc=0.981, eval_loss=4.23, eval_precision=0.779, eval_recall=0.865]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.80      0.87      0.83      2857
          NT       0.62      0.77      0.69      1314

   micro avg       0.79      0.87      0.83      5587
   macro avg       0.79      0.87      0.83      5587
weighted avg       0.80      0.87      0.83      5587



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.45it/s, F1=0.995, train_acc=0.999, train_loss=0.261, train_precision=0.996, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      0.99      0.99       225

   micro avg       1.00      0.99      1.00       858
   macro avg       1.00      0.99      0.99       858
weighted avg       1.00      0.99      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.836, eval_acc=0.982, eval_loss=4.24, eval_precision=0.814, eval_recall=0.863]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.84      0.87      0.86      2857
          NT       0.67      0.76      0.71      1314

   micro avg       0.82      0.87      0.84      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.991, train_acc=1, train_loss=0.106, train_precision=0.988, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.99      0.98       177
          NS       1.00      1.00      1.00       456
          NT       0.97      0.99      0.98       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.837, eval_acc=0.982, eval_loss=4.49, eval_precision=0.818, eval_recall=0.861]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.82      0.87      0.85      2857
          NT       0.72      0.73      0.72      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.82      0.85      0.84      5587
weighted avg       0.82      0.86      0.84      5587



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.40it/s, F1=0.982, train_acc=0.999, train_loss=0.262, train_precision=0.978, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.98      0.99      0.99       456
          NT       0.96      0.99      0.97       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.846, eval_acc=0.983, eval_loss=4.38, eval_precision=0.83, eval_recall=0.866] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.85      0.87      0.86      2857
          NT       0.70      0.77      0.73      1314

   micro avg       0.84      0.87      0.85      5587
   macro avg       0.83      0.87      0.85      5587
weighted avg       0.84      0.87      0.85      5587



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.995, train_acc=1, train_loss=0.077, train_precision=0.993, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.99      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.57it/s, F1=0.843, eval_acc=0.983, eval_loss=4.79, eval_precision=0.835, eval_recall=0.856]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.94      1416
          NS       0.84      0.87      0.86      2857
          NT       0.73      0.75      0.74      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.84      0.85      0.84      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.44it/s, F1=0.99, train_acc=0.999, train_loss=0.271, train_precision=0.988, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.97       177
          NS       0.99      0.99      0.99       456
          NT       0.99      1.00      0.99       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.841, eval_acc=0.983, eval_loss=4.51, eval_precision=0.831, eval_recall=0.854]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.84      0.88      0.86      2857
          NT       0.73      0.71      0.72      1314

   micro avg       0.84      0.85      0.85      5587
   macro avg       0.83      0.84      0.84      5587
weighted avg       0.84      0.85      0.85      5587



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.985, train_acc=0.999, train_loss=0.161, train_precision=0.98, train_recall=0.991]  


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       177
          NS       0.98      0.99      0.99       456
          NT       0.97      0.99      0.98       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.23it/s, F1=0.755, eval_acc=0.973, eval_loss=6.37, eval_precision=0.731, eval_recall=0.786]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.96      0.93      1416
          NS       0.84      0.72      0.77      2857
          NT       0.52      0.80      0.63      1314

   micro avg       0.75      0.80      0.77      5587
   macro avg       0.76      0.82      0.78      5587
weighted avg       0.78      0.80      0.78      5587



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.978, train_acc=0.999, train_loss=0.322, train_precision=0.972, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       0.97      0.99      0.98       456
          NT       0.94      0.96      0.95       225

   micro avg       0.97      0.98      0.98       858
   macro avg       0.97      0.98      0.98       858
weighted avg       0.97      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.832, eval_acc=0.981, eval_loss=4.81, eval_precision=0.817, eval_recall=0.85] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.82      0.84      0.83      2857
          NT       0.68      0.75      0.71      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.82      0.85      0.83      5587



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.89it/s, F1=0.984, train_acc=0.998, train_loss=0.509, train_precision=0.981, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.97      0.98       177
          NS       0.99      1.00      0.99       456
          NT       0.97      0.98      0.97       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.98      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.83, eval_acc=0.981, eval_loss=4.53, eval_precision=0.825, eval_recall=0.838] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.95      0.93      1416
          NS       0.85      0.84      0.84      2857
          NT       0.69      0.74      0.72      1314

   micro avg       0.83      0.84      0.83      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.83      0.84      0.84      5587



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.36it/s, F1=0.956, train_acc=0.997, train_loss=0.576, train_precision=0.95, train_recall=0.963] 


train_reports:
              precision    recall  f1-score   support

          NR       0.88      0.93      0.90       177
          NS       0.96      0.97      0.96       456
          NT       0.97      0.98      0.97       225

   micro avg       0.94      0.96      0.95       858
   macro avg       0.93      0.96      0.95       858
weighted avg       0.94      0.96      0.95       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.829, eval_acc=0.981, eval_loss=4.28, eval_precision=0.807, eval_recall=0.856]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.82      0.84      0.83      2857
          NT       0.69      0.79      0.74      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.86      0.84      5587



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.965, train_acc=0.997, train_loss=0.774, train_precision=0.957, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       177
          NS       0.97      0.98      0.97       456
          NT       0.91      0.96      0.94       225

   micro avg       0.96      0.98      0.97       858
   macro avg       0.95      0.98      0.97       858
weighted avg       0.96      0.98      0.97       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.817, eval_acc=0.98, eval_loss=4.01, eval_precision=0.771, eval_recall=0.875] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.78      0.88      0.83      2857
          NT       0.65      0.78      0.71      1314

   micro avg       0.78      0.88      0.83      5587
   macro avg       0.79      0.87      0.83      5587
weighted avg       0.79      0.88      0.83      5587



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.40it/s, F1=0.992, train_acc=0.999, train_loss=0.183, train_precision=0.989, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.99      0.98       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.99      0.98       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.825, eval_acc=0.981, eval_loss=4.36, eval_precision=0.809, eval_recall=0.846]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.83      0.84      0.84      2857
          NT       0.67      0.78      0.72      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.85      0.83      5587
weighted avg       0.82      0.85      0.84      5587



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.87it/s, F1=0.979, train_acc=1, train_loss=0.0541, train_precision=0.979, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      0.99       225

   micro avg       0.99      1.00      1.00       858
   macro avg       0.99      1.00      0.99       858
weighted avg       0.99      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.839, eval_acc=0.983, eval_loss=4.6, eval_precision=0.834, eval_recall=0.848] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.84      0.86      0.85      2857
          NT       0.70      0.74      0.72      1314

   micro avg       0.84      0.85      0.85      5587
   macro avg       0.84      0.85      0.84      5587
weighted avg       0.84      0.85      0.85      5587



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.997, train_acc=1, train_loss=0.0595, train_precision=0.997, train_recall=0.998]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.99      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       0.99      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.84, eval_acc=0.983, eval_loss=4.61, eval_precision=0.824, eval_recall=0.861] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.84      0.87      0.86      2857
          NT       0.70      0.78      0.74      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.83      0.86      0.85      5587
weighted avg       0.84      0.87      0.85      5587



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.40it/s, F1=0.985, train_acc=0.999, train_loss=0.167, train_precision=0.981, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       1.00      1.00      1.00       456
          NT       0.95      0.98      0.96       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.825, eval_acc=0.981, eval_loss=5.08, eval_precision=0.804, eval_recall=0.851]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.80      0.86      0.83      2857
          NT       0.69      0.72      0.71      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.81      0.85      0.83      5587
weighted avg       0.81      0.85      0.83      5587



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.969, train_acc=0.999, train_loss=0.199, train_precision=0.966, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.98      0.99      0.99       456
          NT       0.96      0.97      0.96       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.831, eval_acc=0.982, eval_loss=4.27, eval_precision=0.814, eval_recall=0.851]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.83      0.86      0.84      2857
          NT       0.66      0.73      0.69      1314

   micro avg       0.82      0.85      0.84      5587
   macro avg       0.82      0.85      0.83      5587
weighted avg       0.82      0.85      0.84      5587



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.87it/s, F1=0.979, train_acc=0.998, train_loss=0.441, train_precision=0.975, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.97      0.99      0.98       456
          NT       0.95      0.96      0.96       225

   micro avg       0.97      0.98      0.98       858
   macro avg       0.98      0.98      0.98       858
weighted avg       0.97      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.813, eval_acc=0.979, eval_loss=4.67, eval_precision=0.763, eval_recall=0.879]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.79      0.87      0.83      2857
          NT       0.62      0.82      0.71      1314

   micro avg       0.78      0.88      0.83      5587
   macro avg       0.78      0.88      0.83      5587
weighted avg       0.79      0.88      0.83      5587



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.999, train_acc=1, train_loss=0.0302, train_precision=1, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.846, eval_acc=0.983, eval_loss=4.43, eval_precision=0.82, eval_recall=0.877] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.83      0.87      0.85      2857
          NT       0.71      0.80      0.75      1314

   micro avg       0.83      0.88      0.85      5587
   macro avg       0.83      0.88      0.85      5587
weighted avg       0.83      0.88      0.85      5587



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.40it/s, F1=0.999, train_acc=1, train_loss=0.0164, train_precision=0.998, train_recall=1]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.855, eval_acc=0.983, eval_loss=4.51, eval_precision=0.838, eval_recall=0.875]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.85      0.88      0.86      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.84      0.87      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.997, train_acc=1, train_loss=0.0369, train_precision=0.996, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.855, eval_acc=0.983, eval_loss=4.6, eval_precision=0.841, eval_recall=0.873] 


eval_reports:
              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.86      0.87      0.86      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.87      0.86      5587



calculate data/few_shot/msra/train_500.json etag: 100%|██████████| 314k/314k [00:00<00:00, 253MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 312MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 369MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 127kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_500.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_500_x2"
}
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 110584.29L/s]
build line mapper: 14L [00:00, 124936.71L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4049.11it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 97892.19it/s]
load dataset from data/few_shot/msra/train_500.json: 59it [00:00, 583.39it/s]

load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_500.json: 500it [00:00, 563.84it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 673.45it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.45it/s, F1=0.0043, train_acc=0.627, train_loss=123, train_precision=0.00232, train_recall=0.033]  


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00       177
          NS       0.00      0.06      0.01       456
          NT       0.00      0.00      0.00       225

   micro avg       0.00      0.03      0.01       858
   macro avg       0.00      0.02      0.00       858
weighted avg       0.00      0.03      0.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0, eval_acc=0.897, eval_loss=30.2, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.39it/s, F1=0.00348, train_acc=0.887, train_loss=32.4, train_precision=0.00255, train_recall=0.00556]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00       177
          NS       0.01      0.00      0.01       456
          NT       0.00      0.00      0.00       225

   micro avg       0.00      0.00      0.00       858
   macro avg       0.00      0.00      0.00       858
weighted avg       0.00      0.00      0.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.0217, eval_acc=0.902, eval_loss=14.6, eval_precision=0.0147, eval_recall=0.0431]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.03      0.10      0.05      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.02      0.05      0.02      5587
   macro avg       0.01      0.03      0.02      5587
weighted avg       0.02      0.05      0.03      5587



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.264, train_acc=0.938, train_loss=12.2, train_precision=0.224, train_recall=0.336]   


train_reports:
              precision    recall  f1-score   support

          NR       0.23      0.28      0.26       177
          NS       0.28      0.48      0.35       456
          NT       0.02      0.07      0.03       225

   micro avg       0.16      0.33      0.22       858
   macro avg       0.18      0.28      0.21       858
weighted avg       0.20      0.33      0.25       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.28it/s, F1=0.564, eval_acc=0.968, eval_loss=5.66, eval_precision=0.514, eval_recall=0.635]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.82      0.87      0.84      1416
          NS       0.67      0.70      0.69      2857
          NT       0.04      0.09      0.06      1314

   micro avg       0.45      0.60      0.52      5587
   macro avg       0.51      0.55      0.53      5587
weighted avg       0.56      0.60      0.58      5587



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.34it/s, F1=0.718, train_acc=0.979, train_loss=4.93, train_precision=0.68, train_recall=0.771] 


train_reports:
              precision    recall  f1-score   support

          NR       0.93      0.94      0.93       177
          NS       0.74      0.78      0.76       456
          NT       0.41      0.62      0.49       225

   micro avg       0.66      0.77      0.71       858
   macro avg       0.69      0.78      0.73       858
weighted avg       0.69      0.77      0.72       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.722, eval_acc=0.976, eval_loss=4.77, eval_precision=0.686, eval_recall=0.772]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.68      0.75      0.71      2857
          NT       0.38      0.55      0.45      1314

   micro avg       0.65      0.75      0.70      5587
   macro avg       0.67      0.75      0.70      5587
weighted avg       0.68      0.75      0.71      5587



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.37it/s, F1=0.822, train_acc=0.989, train_loss=2.31, train_precision=0.806, train_recall=0.845]


train_reports:
              precision    recall  f1-score   support

          NR       0.95      0.95      0.95       177
          NS       0.84      0.85      0.84       456
          NT       0.57      0.74      0.65       225

   micro avg       0.78      0.84      0.81       858
   macro avg       0.79      0.84      0.81       858
weighted avg       0.79      0.84      0.81       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.789, eval_acc=0.98, eval_loss=4.64, eval_precision=0.765, eval_recall=0.821] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.79      0.80      0.79      2857
          NT       0.53      0.71      0.61      1314

   micro avg       0.75      0.82      0.78      5587
   macro avg       0.76      0.82      0.78      5587
weighted avg       0.77      0.82      0.79      5587



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.937, train_acc=0.995, train_loss=1.1, train_precision=0.928, train_recall=0.948]  


train_reports:
              precision    recall  f1-score   support

          NR       0.95      0.95      0.95       177
          NS       0.94      0.94      0.94       456
          NT       0.85      0.92      0.88       225

   micro avg       0.92      0.94      0.93       858
   macro avg       0.91      0.94      0.93       858
weighted avg       0.92      0.94      0.93       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.776, eval_acc=0.98, eval_loss=4.72, eval_precision=0.757, eval_recall=0.805] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.91      0.92      1416
          NS       0.78      0.81      0.79      2857
          NT       0.53      0.67      0.59      1314

   micro avg       0.74      0.80      0.77      5587
   macro avg       0.74      0.79      0.77      5587
weighted avg       0.76      0.80      0.78      5587



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:22<00:00,  2.84it/s, F1=0.945, train_acc=0.996, train_loss=0.835, train_precision=0.938, train_recall=0.953]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.98      0.99       177
          NS       0.95      0.96      0.96       456
          NT       0.87      0.92      0.90       225

   micro avg       0.94      0.95      0.95       858
   macro avg       0.94      0.95      0.95       858
weighted avg       0.94      0.95      0.95       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.789, eval_acc=0.979, eval_loss=4.71, eval_precision=0.742, eval_recall=0.848]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.76      0.83      0.79      2857
          NT       0.54      0.75      0.62      1314

   micro avg       0.74      0.84      0.79      5587
   macro avg       0.75      0.85      0.79      5587
weighted avg       0.76      0.84      0.79      5587



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.50it/s, F1=0.962, train_acc=0.998, train_loss=0.394, train_precision=0.957, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       177
          NS       0.97      0.98      0.98       456
          NT       0.92      0.96      0.94       225

   micro avg       0.96      0.97      0.97       858
   macro avg       0.96      0.97      0.97       858
weighted avg       0.96      0.97      0.97       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.821, eval_acc=0.982, eval_loss=4.65, eval_precision=0.793, eval_recall=0.857]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.79      0.86      0.82      2857
          NT       0.62      0.74      0.68      1314

   micro avg       0.78      0.86      0.82      5587
   macro avg       0.79      0.85      0.82      5587
weighted avg       0.79      0.86      0.82      5587



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:17<00:00,  3.52it/s, F1=0.972, train_acc=0.999, train_loss=0.266, train_precision=0.967, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       177
          NS       0.98      0.98      0.98       456
          NT       0.95      0.96      0.96       225

   micro avg       0.97      0.98      0.98       858
   macro avg       0.97      0.98      0.98       858
weighted avg       0.97      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.816, eval_acc=0.982, eval_loss=4.84, eval_precision=0.787, eval_recall=0.852]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.95      0.95      1416
          NS       0.78      0.86      0.82      2857
          NT       0.62      0.75      0.68      1314

   micro avg       0.78      0.85      0.82      5587
   macro avg       0.79      0.85      0.82      5587
weighted avg       0.79      0.85      0.82      5587



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.87it/s, F1=0.984, train_acc=0.999, train_loss=0.211, train_precision=0.978, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       177
          NS       0.99      1.00      0.99       456
          NT       0.96      0.99      0.97       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.814, eval_acc=0.981, eval_loss=4.86, eval_precision=0.785, eval_recall=0.851]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.80      0.84      0.82      2857
          NT       0.60      0.76      0.67      1314

   micro avg       0.78      0.85      0.81      5587
   macro avg       0.78      0.85      0.81      5587
weighted avg       0.79      0.85      0.82      5587



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.47it/s, F1=0.997, train_acc=1, train_loss=0.126, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.821, eval_acc=0.981, eval_loss=5.34, eval_precision=0.795, eval_recall=0.854]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.81      0.85      0.83      2857
          NT       0.61      0.74      0.67      1314

   micro avg       0.79      0.85      0.82      5587
   macro avg       0.79      0.85      0.82      5587
weighted avg       0.80      0.85      0.82      5587



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.995, train_acc=1, train_loss=0.121, train_precision=0.993, train_recall=0.996]    


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      0.99      0.99       456
          NT       0.98      0.99      0.99       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.823, eval_acc=0.981, eval_loss=6.42, eval_precision=0.811, eval_recall=0.839]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.80      0.84      0.82      2857
          NT       0.65      0.68      0.66      1314

   micro avg       0.80      0.84      0.82      5587
   macro avg       0.80      0.83      0.81      5587
weighted avg       0.80      0.84      0.82      5587



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.989, train_acc=0.999, train_loss=0.223, train_precision=0.985, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.96      0.98      0.97       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.793, eval_acc=0.978, eval_loss=7.4, eval_precision=0.783, eval_recall=0.808] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.93      1416
          NS       0.81      0.83      0.82      2857
          NT       0.58      0.62      0.60      1314

   micro avg       0.78      0.81      0.79      5587
   macro avg       0.77      0.79      0.78      5587
weighted avg       0.78      0.81      0.80      5587



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.91it/s, F1=0.972, train_acc=0.999, train_loss=0.429, train_precision=0.971, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.98      0.98      0.98       456
          NT       0.95      0.97      0.96       225

   micro avg       0.98      0.98      0.98       858
   macro avg       0.98      0.98      0.98       858
weighted avg       0.98      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.831, eval_acc=0.983, eval_loss=4.88, eval_precision=0.801, eval_recall=0.867]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.81      0.88      0.84      2857
          NT       0.65      0.75      0.70      1314

   micro avg       0.80      0.87      0.84      5587
   macro avg       0.80      0.86      0.83      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.37it/s, F1=0.987, train_acc=0.999, train_loss=0.146, train_precision=0.981, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       177
          NS       0.99      1.00      1.00       456
          NT       0.97      0.99      0.98       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.828, eval_acc=0.982, eval_loss=5.31, eval_precision=0.79, eval_recall=0.874] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.81      0.88      0.84      2857
          NT       0.65      0.79      0.71      1314

   micro avg       0.80      0.88      0.84      5587
   macro avg       0.80      0.87      0.84      5587
weighted avg       0.81      0.88      0.84      5587



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.984, train_acc=0.999, train_loss=0.228, train_precision=0.978, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       177
          NS       0.99      0.99      0.99       456
          NT       0.96      0.99      0.97       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.843, eval_acc=0.983, eval_loss=5.3, eval_precision=0.818, eval_recall=0.873] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.83      0.89      0.86      2857
          NT       0.70      0.76      0.73      1314

   micro avg       0.82      0.88      0.85      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.83      0.88      0.85      5587



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.995, train_acc=1, train_loss=0.0781, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      0.99      0.99       225

   micro avg       0.99      1.00      1.00       858
   macro avg       0.99      1.00      1.00       858
weighted avg       0.99      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.31it/s, F1=0.827, eval_acc=0.981, eval_loss=5.54, eval_precision=0.782, eval_recall=0.882]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.82      0.88      0.85      2857
          NT       0.63      0.83      0.72      1314

   micro avg       0.80      0.88      0.84      5587
   macro avg       0.80      0.89      0.84      5587
weighted avg       0.81      0.88      0.84      5587



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.996, train_acc=1, train_loss=0.137, train_precision=0.994, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      0.99       225

   micro avg       0.99      1.00      1.00       858
   macro avg       0.99      1.00      1.00       858
weighted avg       0.99      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.828, eval_acc=0.982, eval_loss=5.15, eval_precision=0.791, eval_recall=0.874]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.96      0.94      1416
          NS       0.83      0.88      0.85      2857
          NT       0.65      0.78      0.71      1314

   micro avg       0.80      0.88      0.84      5587
   macro avg       0.80      0.87      0.83      5587
weighted avg       0.81      0.88      0.84      5587



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.39it/s, F1=0.996, train_acc=1, train_loss=0.0617, train_precision=0.993, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       0.99      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.831, eval_acc=0.983, eval_loss=5.34, eval_precision=0.795, eval_recall=0.875]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.83      0.88      0.85      2857
          NT       0.67      0.78      0.72      1314

   micro avg       0.81      0.88      0.84      5587
   macro avg       0.81      0.87      0.84      5587
weighted avg       0.81      0.88      0.84      5587



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.37it/s, F1=0.993, train_acc=0.999, train_loss=0.287, train_precision=0.995, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.99      1.00      0.99       456
          NT       0.99      0.98      0.98       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.828, eval_acc=0.983, eval_loss=5.21, eval_precision=0.807, eval_recall=0.855]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.82      0.88      0.85      2857
          NT       0.62      0.69      0.65      1314

   micro avg       0.80      0.85      0.83      5587
   macro avg       0.80      0.84      0.82      5587
weighted avg       0.81      0.85      0.83      5587



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.39it/s, F1=0.973, train_acc=0.999, train_loss=0.205, train_precision=0.969, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.99      0.99      0.99       456
          NT       0.97      0.99      0.98       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.825, eval_acc=0.982, eval_loss=5.35, eval_precision=0.808, eval_recall=0.847]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.82      0.83      0.83      2857
          NT       0.62      0.75      0.68      1314

   micro avg       0.79      0.84      0.82      5587
   macro avg       0.79      0.84      0.82      5587
weighted avg       0.80      0.84      0.82      5587



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.46it/s, F1=0.979, train_acc=0.999, train_loss=0.427, train_precision=0.975, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       177
          NS       0.98      0.99      0.99       456
          NT       0.95      0.96      0.96       225

   micro avg       0.97      0.98      0.98       858
   macro avg       0.97      0.98      0.97       858
weighted avg       0.97      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.817, eval_acc=0.981, eval_loss=5.27, eval_precision=0.797, eval_recall=0.843]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.94      0.93      1416
          NS       0.79      0.84      0.82      2857
          NT       0.64      0.72      0.68      1314

   micro avg       0.79      0.84      0.81      5587
   macro avg       0.79      0.83      0.81      5587
weighted avg       0.79      0.84      0.81      5587



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.974, train_acc=1, train_loss=0.148, train_precision=0.972, train_recall=0.976]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       1.00      0.99      1.00       456
          NT       0.97      0.99      0.98       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.826, eval_acc=0.982, eval_loss=5.22, eval_precision=0.796, eval_recall=0.862]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.80      0.87      0.84      2857
          NT       0.64      0.75      0.69      1314

   micro avg       0.79      0.86      0.83      5587
   macro avg       0.79      0.86      0.82      5587
weighted avg       0.80      0.86      0.83      5587



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.992, train_acc=1, train_loss=0.114, train_precision=0.991, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      0.99      0.99       456
          NT       0.99      1.00      0.99       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.99      1.00      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.825, eval_acc=0.982, eval_loss=5.66, eval_precision=0.811, eval_recall=0.843]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.93      0.93      1416
          NS       0.80      0.85      0.82      2857
          NT       0.68      0.72      0.70      1314

   micro avg       0.80      0.84      0.82      5587
   macro avg       0.80      0.83      0.82      5587
weighted avg       0.80      0.84      0.82      5587



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.92it/s, F1=0.995, train_acc=1, train_loss=0.107, train_precision=0.995, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.824, eval_acc=0.982, eval_loss=5.45, eval_precision=0.789, eval_recall=0.867]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.80      0.86      0.83      2857
          NT       0.66      0.78      0.72      1314

   micro avg       0.79      0.87      0.83      5587
   macro avg       0.80      0.87      0.83      5587
weighted avg       0.80      0.87      0.83      5587



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.99, train_acc=1, train_loss=0.0952, train_precision=0.987, train_recall=0.994]    


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.99      0.98       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.99      0.99       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.12it/s, F1=0.832, eval_acc=0.982, eval_loss=5.88, eval_precision=0.819, eval_recall=0.851]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.82      0.86      0.84      2857
          NT       0.71      0.72      0.71      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.82      0.85      0.83      5587



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.49it/s, F1=0.999, train_acc=1, train_loss=0.0476, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.835, eval_acc=0.983, eval_loss=5.83, eval_precision=0.819, eval_recall=0.855]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.93      1416
          NS       0.82      0.86      0.84      2857
          NT       0.70      0.73      0.71      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.81      0.84      0.83      5587
weighted avg       0.82      0.85      0.83      5587



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.995, train_acc=0.999, train_loss=0.121, train_precision=0.995, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.98      0.98       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.49it/s, F1=0.801, eval_acc=0.979, eval_loss=5.98, eval_precision=0.756, eval_recall=0.862]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.95      0.93      1416
          NS       0.77      0.87      0.81      2857
          NT       0.64      0.75      0.69      1314

   micro avg       0.77      0.86      0.81      5587
   macro avg       0.77      0.86      0.81      5587
weighted avg       0.77      0.86      0.82      5587



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.994, train_acc=1, train_loss=0.0724, train_precision=0.991, train_recall=0.997]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       0.99      1.00      1.00       456
          NT       0.98      0.99      0.98       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.99      1.00      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.19it/s, F1=0.812, eval_acc=0.979, eval_loss=6.36, eval_precision=0.782, eval_recall=0.851]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.82      0.82      0.82      2857
          NT       0.60      0.80      0.68      1314

   micro avg       0.78      0.85      0.81      5587
   macro avg       0.79      0.86      0.82      5587
weighted avg       0.80      0.85      0.82      5587



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.993, train_acc=0.999, train_loss=0.126, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.99      0.98       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.823, eval_acc=0.98, eval_loss=6.21, eval_precision=0.802, eval_recall=0.85]  


eval_reports:
              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.82      0.85      0.83      2857
          NT       0.63      0.74      0.68      1314

   micro avg       0.80      0.84      0.82      5587
   macro avg       0.80      0.84      0.82      5587
weighted avg       0.80      0.84      0.82      5587



calculate data/few_shot/msra/train_500.json etag: 100%|██████████| 314k/314k [00:00<00:00, 279MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 331MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 341MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 127kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_500.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_500_x3"
}
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 138818.57L/s]
build line mapper: 14L [00:00, 120082.32L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4936.96it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 165732.38it/s]
load dataset from data/few_shot/msra/train_500.json: 59it [00:00, 581.15it/s]

load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/3a418bc5bceb142b229b235ce03f275d_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_500.json: 500it [00:00, 568.08it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:07, 583.77it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.36it/s, F1=0.000564, train_acc=0.606, train_loss=99.5, train_precision=0.000297, train_recall=0.00659]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00       177
          NS       0.00      0.01      0.00       456
          NT       0.00      0.00      0.00       225

   micro avg       0.00      0.01      0.00       858
   macro avg       0.00      0.00      0.00       858
weighted avg       0.00      0.01      0.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0, eval_acc=0.897, eval_loss=25.7, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.00      0.00      0.00      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.00      0.00      0.00      5587
   macro avg       0.00      0.00      0.00      5587
weighted avg       0.00      0.00      0.00      5587



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.00263, train_acc=0.887, train_loss=23.8, train_precision=0.00199, train_recall=0.00407]  


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00       177
          NS       0.01      0.01      0.01       456
          NT       0.00      0.00      0.00       225

   micro avg       0.01      0.00      0.01       858
   macro avg       0.00      0.00      0.00       858
weighted avg       0.01      0.00      0.01       858



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.71it/s, F1=0.0373, eval_acc=0.924, eval_loss=10.3, eval_precision=0.0268, eval_recall=0.0631]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.04      0.12      0.06      1416
          NS       0.03      0.07      0.04      2857
          NT       0.00      0.00      0.00      1314

   micro avg       0.03      0.07      0.04      5587
   macro avg       0.02      0.06      0.03      5587
weighted avg       0.03      0.07      0.04      5587



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.459, train_acc=0.955, train_loss=8.72, train_precision=0.413, train_recall=0.534]


train_reports:
              precision    recall  f1-score   support

          NR       0.51      0.79      0.62       177
          NS       0.47      0.54      0.50       456
          NT       0.15      0.30      0.20       225

   micro avg       0.36      0.53      0.43       858
   macro avg       0.38      0.54      0.44       858
weighted avg       0.39      0.53      0.45       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.584, eval_acc=0.969, eval_loss=4.64, eval_precision=0.538, eval_recall=0.65] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.89      0.91      0.90      1416
          NS       0.70      0.70      0.70      2857
          NT       0.10      0.20      0.13      1314

   micro avg       0.51      0.63      0.56      5587
   macro avg       0.56      0.60      0.58      5587
weighted avg       0.61      0.63      0.62      5587



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.37it/s, F1=0.726, train_acc=0.981, train_loss=4.36, train_precision=0.706, train_recall=0.764]


train_reports:
              precision    recall  f1-score   support

          NR       0.90      0.88      0.89       177
          NS       0.80      0.81      0.81       456
          NT       0.41      0.59      0.48       225

   micro avg       0.69      0.77      0.72       858
   macro avg       0.70      0.76      0.73       858
weighted avg       0.72      0.77      0.74       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.726, eval_acc=0.976, eval_loss=3.52, eval_precision=0.677, eval_recall=0.791]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.75      0.81      0.78      2857
          NT       0.34      0.53      0.42      1314

   micro avg       0.66      0.78      0.72      5587
   macro avg       0.68      0.77      0.71      5587
weighted avg       0.70      0.78      0.74      5587



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.44it/s, F1=0.874, train_acc=0.991, train_loss=1.79, train_precision=0.862, train_recall=0.892]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.93      0.96       177
          NS       0.89      0.89      0.89       456
          NT       0.72      0.84      0.78       225

   micro avg       0.86      0.89      0.87       858
   macro avg       0.87      0.89      0.88       858
weighted avg       0.87      0.89      0.88       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.58it/s, F1=0.793, eval_acc=0.978, eval_loss=3.65, eval_precision=0.749, eval_recall=0.85] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.79      0.85      0.82      2857
          NT       0.55      0.76      0.64      1314

   micro avg       0.76      0.85      0.80      5587
   macro avg       0.77      0.85      0.80      5587
weighted avg       0.77      0.85      0.81      5587



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.897, train_acc=0.993, train_loss=1.23, train_precision=0.887, train_recall=0.909]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.95      0.97       177
          NS       0.91      0.93      0.92       456
          NT       0.83      0.90      0.86       225

   micro avg       0.90      0.93      0.92       858
   macro avg       0.91      0.93      0.92       858
weighted avg       0.91      0.93      0.92       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.795, eval_acc=0.98, eval_loss=3.63, eval_precision=0.77, eval_recall=0.828]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.97      0.94      0.95      1416
          NS       0.84      0.81      0.82      2857
          NT       0.52      0.74      0.61      1314

   micro avg       0.77      0.83      0.80      5587
   macro avg       0.78      0.83      0.80      5587
weighted avg       0.80      0.83      0.81      5587



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.962, train_acc=0.997, train_loss=0.662, train_precision=0.96, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.97      0.98       177
          NS       0.97      0.96      0.97       456
          NT       0.89      0.94      0.92       225

   micro avg       0.95      0.96      0.96       858
   macro avg       0.95      0.96      0.95       858
weighted avg       0.95      0.96      0.96       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.826, eval_acc=0.981, eval_loss=3.6, eval_precision=0.796, eval_recall=0.864] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.83      0.86      0.84      2857
          NT       0.64      0.78      0.70      1314

   micro avg       0.81      0.86      0.83      5587
   macro avg       0.80      0.86      0.83      5587
weighted avg       0.81      0.86      0.84      5587



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.38it/s, F1=0.97, train_acc=0.997, train_loss=0.517, train_precision=0.965, train_recall=0.975] 


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.97       177
          NS       0.98      0.98      0.98       456
          NT       0.91      0.94      0.93       225

   micro avg       0.96      0.97      0.97       858
   macro avg       0.95      0.97      0.96       858
weighted avg       0.96      0.97      0.97       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.827, eval_acc=0.98, eval_loss=3.69, eval_precision=0.801, eval_recall=0.86]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.81      0.85      0.83      2857
          NT       0.66      0.79      0.72      1314

   micro avg       0.81      0.86      0.83      5587
   macro avg       0.81      0.86      0.83      5587
weighted avg       0.81      0.86      0.83      5587



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.98, train_acc=0.999, train_loss=0.334, train_precision=0.979, train_recall=0.982] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       177
          NS       0.98      0.98      0.98       456
          NT       0.96      0.96      0.96       225

   micro avg       0.98      0.98      0.98       858
   macro avg       0.97      0.98      0.98       858
weighted avg       0.98      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.823, eval_acc=0.981, eval_loss=3.83, eval_precision=0.792, eval_recall=0.864]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.80      0.88      0.83      2857
          NT       0.68      0.77      0.72      1314

   micro avg       0.80      0.87      0.84      5587
   macro avg       0.81      0.86      0.84      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.92it/s, F1=0.987, train_acc=0.999, train_loss=0.316, train_precision=0.985, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       0.98      0.99      0.99       456
          NT       0.96      0.97      0.97       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.771, eval_acc=0.977, eval_loss=4.74, eval_precision=0.73, eval_recall=0.824] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.97      0.95      0.96      1416
          NS       0.72      0.89      0.80      2857
          NT       0.50      0.55      0.53      1314

   micro avg       0.73      0.82      0.77      5587
   macro avg       0.73      0.80      0.76      5587
weighted avg       0.73      0.82      0.77      5587



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.44it/s, F1=0.943, train_acc=0.997, train_loss=0.616, train_precision=0.933, train_recall=0.955]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       177
          NS       0.92      0.95      0.94       456
          NT       0.88      0.93      0.91       225

   micro avg       0.92      0.95      0.94       858
   macro avg       0.93      0.96      0.94       858
weighted avg       0.92      0.95      0.94       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.82, eval_acc=0.982, eval_loss=4.18, eval_precision=0.803, eval_recall=0.843] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.81      0.88      0.84      2857
          NT       0.68      0.70      0.69      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.82      0.85      0.83      5587



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.40it/s, F1=0.99, train_acc=0.999, train_loss=0.186, train_precision=0.988, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.98      0.99      0.99       456
          NT       0.98      0.99      0.98       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.39it/s, F1=0.833, eval_acc=0.982, eval_loss=4.12, eval_precision=0.81, eval_recall=0.861] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.82      0.86      0.84      2857
          NT       0.67      0.76      0.71      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.86      0.84      5587



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.46it/s, F1=0.993, train_acc=1, train_loss=0.0865, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      0.99      0.99       456
          NT       0.98      1.00      0.99       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.99      1.00      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.70it/s, F1=0.833, eval_acc=0.982, eval_loss=4.54, eval_precision=0.819, eval_recall=0.852]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.83      0.85      0.84      2857
          NT       0.70      0.74      0.72      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.82      0.85      0.84      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.39it/s, F1=0.993, train_acc=1, train_loss=0.0989, train_precision=0.992, train_recall=0.994]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      0.99      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       0.99      0.99      0.99       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.842, eval_acc=0.983, eval_loss=4.42, eval_precision=0.84, eval_recall=0.849] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.95      0.96      1416
          NS       0.84      0.86      0.85      2857
          NT       0.72      0.71      0.72      1314

   micro avg       0.84      0.85      0.85      5587
   macro avg       0.84      0.84      0.84      5587
weighted avg       0.84      0.85      0.85      5587



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.997, train_acc=1, train_loss=0.186, train_precision=0.997, train_recall=0.996]    


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      0.99      0.99       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.39it/s, F1=0.842, eval_acc=0.983, eval_loss=4.19, eval_precision=0.823, eval_recall=0.866]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.82      0.89      0.85      2857
          NT       0.71      0.71      0.71      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.99, train_acc=0.999, train_loss=0.106, train_precision=0.989, train_recall=0.992]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      0.99      0.99       456
          NT       0.99      0.99      0.99       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.39it/s, F1=0.825, eval_acc=0.98, eval_loss=4.53, eval_precision=0.794, eval_recall=0.863] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.82      0.86      0.84      2857
          NT       0.64      0.79      0.71      1314

   micro avg       0.80      0.87      0.83      5587
   macro avg       0.81      0.87      0.83      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.92it/s, F1=0.989, train_acc=0.999, train_loss=0.145, train_precision=0.987, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      1.00      0.99       456
          NT       0.98      0.99      0.98       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.833, eval_acc=0.984, eval_loss=4.32, eval_precision=0.826, eval_recall=0.844]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.84      0.87      0.85      2857
          NT       0.67      0.69      0.68      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.991, train_acc=0.999, train_loss=0.161, train_precision=0.986, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      1.00      0.99       456
          NT       0.97      0.99      0.98       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.99      1.00      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.839, eval_acc=0.983, eval_loss=4.1, eval_precision=0.831, eval_recall=0.852] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.97      0.95      0.96      1416
          NS       0.85      0.87      0.86      2857
          NT       0.69      0.71      0.70      1314

   micro avg       0.84      0.85      0.85      5587
   macro avg       0.84      0.84      0.84      5587
weighted avg       0.84      0.85      0.85      5587



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.992, train_acc=0.999, train_loss=0.124, train_precision=0.992, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.98      0.98       225

   micro avg       0.99      0.99      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.28it/s, F1=0.825, eval_acc=0.982, eval_loss=4.04, eval_precision=0.79, eval_recall=0.87]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.95      0.96      1416
          NS       0.80      0.87      0.83      2857
          NT       0.66      0.80      0.72      1314

   micro avg       0.80      0.87      0.83      5587
   macro avg       0.81      0.87      0.84      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.997, train_acc=1, train_loss=0.085, train_precision=0.996, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       177
          NS       1.00      1.00      1.00       456
          NT       0.99      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.833, eval_acc=0.984, eval_loss=4.16, eval_precision=0.817, eval_recall=0.854]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.81      0.86      0.83      2857
          NT       0.70      0.72      0.71      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.85      0.83      5587
weighted avg       0.82      0.85      0.84      5587



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.41it/s, F1=0.998, train_acc=1, train_loss=0.0267, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       1.00      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.832, eval_acc=0.983, eval_loss=4.11, eval_precision=0.807, eval_recall=0.863]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.82      0.87      0.85      2857
          NT       0.68      0.77      0.72      1314

   micro avg       0.82      0.87      0.85      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.82      0.87      0.85      5587



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.35it/s, F1=0.987, train_acc=0.998, train_loss=0.333, train_precision=0.983, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       177
          NS       0.99      1.00      1.00       456
          NT       0.94      0.97      0.96       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.824, eval_acc=0.982, eval_loss=4, eval_precision=0.808, eval_recall=0.844]   


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.82      0.86      0.84      2857
          NT       0.65      0.71      0.68      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.81      0.84      0.82      5587
weighted avg       0.81      0.85      0.83      5587



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.48it/s, F1=0.976, train_acc=0.999, train_loss=0.45, train_precision=0.971, train_recall=0.981] 


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.95      0.96       177
          NS       0.96      0.98      0.97       456
          NT       0.99      0.99      0.99       225

   micro avg       0.97      0.98      0.97       858
   macro avg       0.97      0.98      0.97       858
weighted avg       0.97      0.98      0.97       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.40it/s, F1=0.816, eval_acc=0.98, eval_loss=4.66, eval_precision=0.784, eval_recall=0.856] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.92      0.94      1416
          NS       0.80      0.88      0.83      2857
          NT       0.66      0.77      0.71      1314

   micro avg       0.80      0.86      0.83      5587
   macro avg       0.81      0.86      0.83      5587
weighted avg       0.81      0.86      0.83      5587



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.44it/s, F1=0.998, train_acc=1, train_loss=0.0683, train_precision=0.997, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       177
          NS       1.00      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.84, eval_acc=0.982, eval_loss=4.91, eval_precision=0.825, eval_recall=0.86]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.83      0.88      0.85      2857
          NT       0.70      0.74      0.72      1314

   micro avg       0.83      0.86      0.84      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.83      0.86      0.85      5587



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.982, train_acc=1, train_loss=0.0306, train_precision=0.982, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       1.00      1.00      1.00       456
          NT       1.00      1.00      1.00       225

   micro avg       1.00      1.00      1.00       858
   macro avg       1.00      1.00      1.00       858
weighted avg       1.00      1.00      1.00       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.31it/s, F1=0.836, eval_acc=0.982, eval_loss=5.03, eval_precision=0.819, eval_recall=0.858]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.83      0.88      0.86      2857
          NT       0.69      0.73      0.71      1314

   micro avg       0.83      0.86      0.84      5587
   macro avg       0.82      0.85      0.84      5587
weighted avg       0.83      0.86      0.84      5587



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.981, train_acc=0.999, train_loss=0.297, train_precision=0.978, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.97       177
          NS       0.98      0.99      0.99       456
          NT       0.97      0.98      0.98       225

   micro avg       0.98      0.98      0.98       858
   macro avg       0.97      0.98      0.98       858
weighted avg       0.98      0.98      0.98       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.813, eval_acc=0.98, eval_loss=5.29, eval_precision=0.79, eval_recall=0.842]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.96      0.93      1416
          NS       0.80      0.87      0.83      2857
          NT       0.68      0.66      0.67      1314

   micro avg       0.80      0.84      0.82      5587
   macro avg       0.79      0.83      0.81      5587
weighted avg       0.79      0.84      0.82      5587



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.42it/s, F1=0.994, train_acc=1, train_loss=0.143, train_precision=0.993, train_recall=0.996]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       177
          NS       1.00      1.00      1.00       456
          NT       0.98      0.99      0.98       225

   micro avg       0.99      1.00      0.99       858
   macro avg       0.99      0.99      0.99       858
weighted avg       0.99      1.00      0.99       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.837, eval_acc=0.983, eval_loss=4.04, eval_precision=0.814, eval_recall=0.866]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.82      0.88      0.85      2857
          NT       0.69      0.77      0.73      1314

   micro avg       0.82      0.87      0.84      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.87      0.85      5587



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:21<00:00,  2.87it/s, F1=0.99, train_acc=0.999, train_loss=0.161, train_precision=0.986, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       177
          NS       0.99      1.00      0.99       456
          NT       0.97      0.98      0.97       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.99      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.826, eval_acc=0.981, eval_loss=5.64, eval_precision=0.826, eval_recall=0.829]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.86      0.85      0.85      2857
          NT       0.65      0.66      0.66      1314

   micro avg       0.83      0.83      0.83      5587
   macro avg       0.82      0.82      0.82      5587
weighted avg       0.83      0.83      0.83      5587



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.46it/s, F1=0.983, train_acc=0.999, train_loss=0.195, train_precision=0.981, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       177
          NS       0.99      0.99      0.99       456
          NT       0.96      0.97      0.96       225

   micro avg       0.98      0.99      0.99       858
   macro avg       0.98      0.99      0.98       858
weighted avg       0.98      0.99      0.99       858



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.83, eval_acc=0.982, eval_loss=5.04, eval_precision=0.808, eval_recall=0.859] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.83      0.88      0.86      2857
          NT       0.67      0.76      0.71      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.86      0.84      5587



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.43it/s, F1=0.984, train_acc=0.999, train_loss=0.386, train_precision=0.982, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       177
          NS       0.98      0.99      0.99       456
          NT       0.97      0.97      0.97       225

   micro avg       0.98      0.99      0.98       858
   macro avg       0.98      0.99      0.99       858
weighted avg       0.98      0.99      0.98       858



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.826, eval_acc=0.982, eval_loss=4.68, eval_precision=0.814, eval_recall=0.842]


eval_reports:
              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.80      0.86      0.83      2857
          NT       0.70      0.70      0.70      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.81      0.85      0.83      5587



calculate data/few_shot/msra/train_1000.json etag: 100%|██████████| 597k/597k [00:00<00:00, 28.8MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 336MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 370MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 120kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_1000.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_1000_x1"
}
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 124936.71L/s]
build line mapper: 14L [00:00, 121574.03L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4293.67it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 163741.60it/s]

load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding



load dataset from data/few_shot/msra/train_1000.json: 1000it [00:01, 587.84it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 673.56it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model 

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.0153, train_acc=0.744, train_loss=45.5, train_precision=0.0137, train_recall=0.0227]    


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.01      0.00       375
          NS       0.01      0.04      0.02       821
          NT       0.00      0.01      0.00       432

   micro avg       0.01      0.02      0.01      1628
   macro avg       0.01      0.02      0.01      1628
weighted avg       0.01      0.02      0.01      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.23it/s, F1=0.246, eval_acc=0.938, eval_loss=9.39, eval_precision=0.202, eval_recall=0.322]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.08      0.17      0.11      1416
          NS       0.36      0.49      0.41      2857
          NT       0.05      0.10      0.07      1314

   micro avg       0.19      0.32      0.23      5587
   macro avg       0.16      0.25      0.20      5587
weighted avg       0.22      0.32      0.26      5587



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.585, train_acc=0.967, train_loss=5.84, train_precision=0.548, train_recall=0.644]


train_reports:
              precision    recall  f1-score   support

          NR       0.61      0.74      0.67       375
          NS       0.58      0.69      0.63       821
          NT       0.34      0.49      0.40       432

   micro avg       0.51      0.65      0.57      1628
   macro avg       0.51      0.64      0.57      1628
weighted avg       0.52      0.65      0.58      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.755, eval_acc=0.978, eval_loss=3.43, eval_precision=0.702, eval_recall=0.827]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.73      0.79      0.76      2857
          NT       0.48      0.76      0.59      1314

   micro avg       0.69      0.82      0.75      5587
   macro avg       0.71      0.84      0.76      5587
weighted avg       0.72      0.82      0.76      5587



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.874, train_acc=0.99, train_loss=1.77, train_precision=0.86, train_recall=0.896]  


train_reports:
              precision    recall  f1-score   support

          NR       0.93      0.94      0.93       375
          NS       0.88      0.92      0.90       821
          NT       0.75      0.85      0.79       432

   micro avg       0.85      0.90      0.88      1628
   macro avg       0.85      0.90      0.88      1628
weighted avg       0.86      0.90      0.88      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.814, eval_acc=0.979, eval_loss=3.53, eval_precision=0.773, eval_recall=0.864]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.81      0.86      0.83      2857
          NT       0.60      0.82      0.69      1314

   micro avg       0.78      0.87      0.82      5587
   macro avg       0.79      0.87      0.83      5587
weighted avg       0.80      0.87      0.83      5587



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.927, train_acc=0.994, train_loss=1, train_precision=0.913, train_recall=0.945]    


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.96      0.96       375
          NS       0.95      0.97      0.96       821
          NT       0.83      0.90      0.86       432

   micro avg       0.92      0.95      0.93      1628
   macro avg       0.91      0.94      0.93      1628
weighted avg       0.92      0.95      0.93      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.837, eval_acc=0.983, eval_loss=3.16, eval_precision=0.804, eval_recall=0.879]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.81      0.89      0.85      2857
          NT       0.68      0.79      0.73      1314

   micro avg       0.81      0.88      0.84      5587
   macro avg       0.81      0.87      0.84      5587
weighted avg       0.82      0.88      0.85      5587



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.961, train_acc=0.998, train_loss=0.425, train_precision=0.955, train_recall=0.968]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       375
          NS       0.96      0.98      0.97       821
          NT       0.92      0.95      0.94       432

   micro avg       0.96      0.97      0.96      1628
   macro avg       0.96      0.97      0.96      1628
weighted avg       0.96      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.853, eval_acc=0.985, eval_loss=3.48, eval_precision=0.84, eval_recall=0.869] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.83      0.88      0.85      2857
          NT       0.74      0.76      0.75      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.83      0.86      0.85      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.986, train_acc=0.999, train_loss=0.208, train_precision=0.985, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.99       821
          NT       0.97      0.99      0.98       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.98      1628
weighted avg       0.98      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.843, eval_acc=0.983, eval_loss=3.98, eval_precision=0.815, eval_recall=0.878]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.84      0.87      0.86      2857
          NT       0.68      0.82      0.74      1314

   micro avg       0.82      0.88      0.85      5587
   macro avg       0.82      0.88      0.85      5587
weighted avg       0.82      0.88      0.85      5587



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.15it/s, F1=0.973, train_acc=0.999, train_loss=0.197, train_precision=0.97, train_recall=0.975] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.96      0.97      0.97       432

   micro avg       0.98      0.98      0.98      1628
   macro avg       0.98      0.98      0.98      1628
weighted avg       0.98      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.21it/s, F1=0.861, eval_acc=0.984, eval_loss=3.88, eval_precision=0.852, eval_recall=0.874]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.84      0.89      0.86      2857
          NT       0.76      0.77      0.77      1314

   micro avg       0.85      0.88      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.972, train_acc=0.998, train_loss=0.477, train_precision=0.965, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       375
          NS       0.97      0.98      0.98       821
          NT       0.92      0.97      0.94       432

   micro avg       0.96      0.98      0.97      1628
   macro avg       0.96      0.98      0.97      1628
weighted avg       0.96      0.98      0.97      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.85, eval_acc=0.983, eval_loss=4.18, eval_precision=0.841, eval_recall=0.863] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.84      0.86      0.85      2857
          NT       0.72      0.76      0.74      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.83      0.86      0.85      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.98, train_acc=0.999, train_loss=0.309, train_precision=0.976, train_recall=0.985] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.95      0.97      0.96       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.841, eval_acc=0.983, eval_loss=4.32, eval_precision=0.831, eval_recall=0.855]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.91      0.94      1416
          NS       0.82      0.89      0.85      2857
          NT       0.73      0.73      0.73      1314

   micro avg       0.83      0.86      0.85      5587
   macro avg       0.84      0.85      0.84      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.52it/s, F1=0.973, train_acc=0.998, train_loss=0.37, train_precision=0.97, train_recall=0.977]  


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.97      0.97       375
          NS       0.99      1.00      0.99       821
          NT       0.96      0.98      0.97       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.844, eval_acc=0.983, eval_loss=3.95, eval_precision=0.829, eval_recall=0.863]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.96      0.93      1416
          NS       0.86      0.86      0.86      2857
          NT       0.70      0.77      0.74      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.965, train_acc=0.998, train_loss=0.48, train_precision=0.956, train_recall=0.975] 


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.97      0.96       375
          NS       0.96      0.98      0.97       821
          NT       0.93      0.96      0.95       432

   micro avg       0.95      0.97      0.96      1628
   macro avg       0.95      0.97      0.96      1628
weighted avg       0.95      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.837, eval_acc=0.981, eval_loss=4.36, eval_precision=0.822, eval_recall=0.858]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.93      1416
          NS       0.86      0.83      0.84      2857
          NT       0.67      0.85      0.75      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.83      0.86      0.84      5587



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.989, train_acc=0.999, train_loss=0.244, train_precision=0.985, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      1.00      0.99       821
          NT       0.96      0.98      0.97       432

   micro avg       0.98      0.99      0.99      1628
   macro avg       0.98      0.99      0.99      1628
weighted avg       0.98      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.848, eval_acc=0.983, eval_loss=4.15, eval_precision=0.833, eval_recall=0.867]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.95      0.93      1416
          NS       0.87      0.86      0.86      2857
          NT       0.71      0.82      0.76      1314

   micro avg       0.84      0.87      0.86      5587
   macro avg       0.83      0.88      0.85      5587
weighted avg       0.84      0.87      0.86      5587



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.989, train_acc=0.999, train_loss=0.159, train_precision=0.987, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      0.99      0.99       821
          NT       0.97      0.99      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.854, eval_acc=0.984, eval_loss=3.9, eval_precision=0.844, eval_recall=0.869] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.85      0.89      0.87      2857
          NT       0.73      0.75      0.74      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.84      0.86      0.85      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.17it/s, F1=0.994, train_acc=1, train_loss=0.104, train_precision=0.992, train_recall=0.996]   


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       375
          NS       0.99      1.00      0.99       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.28it/s, F1=0.851, eval_acc=0.984, eval_loss=4.58, eval_precision=0.85, eval_recall=0.857] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.84      0.87      0.85      2857
          NT       0.76      0.75      0.76      1314

   micro avg       0.85      0.86      0.85      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.85      0.86      0.85      5587



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.48it/s, F1=0.997, train_acc=1, train_loss=0.0677, train_precision=0.996, train_recall=0.997]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      1.00      0.99       821
          NT       1.00      1.00      1.00       432

   micro avg       0.99      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       0.99      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.857, eval_acc=0.984, eval_loss=4.49, eval_precision=0.852, eval_recall=0.867]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.85      0.87      0.86      2857
          NT       0.76      0.78      0.77      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.52it/s, F1=0.994, train_acc=1, train_loss=0.0575, train_precision=0.993, train_recall=0.996]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      1.00      1628
   macro avg       0.99      1.00      1.00      1628
weighted avg       0.99      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.59it/s, F1=0.859, eval_acc=0.985, eval_loss=4.26, eval_precision=0.86, eval_recall=0.861] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.85      0.88      0.86      2857
          NT       0.79      0.75      0.77      1314

   micro avg       0.86      0.86      0.86      5587
   macro avg       0.86      0.86      0.86      5587
weighted avg       0.86      0.86      0.86      5587



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.997, train_acc=1, train_loss=0.0269, train_precision=0.996, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      0.99       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.843, eval_acc=0.983, eval_loss=4.48, eval_precision=0.819, eval_recall=0.875]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.79      0.89      0.84      2857
          NT       0.77      0.80      0.78      1314

   micro avg       0.83      0.88      0.85      5587
   macro avg       0.84      0.87      0.86      5587
weighted avg       0.83      0.88      0.85      5587



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.996, train_acc=1, train_loss=0.0377, train_precision=0.995, train_recall=0.998]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.847, eval_acc=0.983, eval_loss=5.38, eval_precision=0.833, eval_recall=0.865]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.79      0.87      0.83      2857
          NT       0.78      0.77      0.78      1314

   micro avg       0.83      0.86      0.85      5587
   macro avg       0.84      0.86      0.85      5587
weighted avg       0.83      0.86      0.85      5587



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.15it/s, F1=0.993, train_acc=1, train_loss=0.102, train_precision=0.991, train_recall=0.995]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      1.00      0.99       821
          NT       1.00      1.00      1.00       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.849, eval_acc=0.983, eval_loss=5.08, eval_precision=0.848, eval_recall=0.855]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.90      0.92      1416
          NS       0.84      0.87      0.86      2857
          NT       0.78      0.78      0.78      1314

   micro avg       0.85      0.86      0.85      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.85      0.86      0.85      5587



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.992, train_acc=0.999, train_loss=0.207, train_precision=0.99, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       1.00      1.00      1.00       821
          NT       0.98      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.853, eval_acc=0.982, eval_loss=4.91, eval_precision=0.851, eval_recall=0.858]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.85      0.85      0.85      2857
          NT       0.75      0.78      0.77      1314

   micro avg       0.85      0.86      0.86      5587
   macro avg       0.85      0.86      0.86      5587
weighted avg       0.85      0.86      0.86      5587



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.17it/s, F1=0.994, train_acc=0.999, train_loss=0.14, train_precision=0.993, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      0.99      0.99       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.13it/s, F1=0.854, eval_acc=0.983, eval_loss=4.45, eval_precision=0.843, eval_recall=0.869]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.84      0.87      0.85      2857
          NT       0.75      0.78      0.77      1314

   micro avg       0.84      0.87      0.86      5587
   macro avg       0.84      0.87      0.85      5587
weighted avg       0.84      0.87      0.86      5587



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.997, train_acc=1, train_loss=0.0474, train_precision=0.996, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.846, eval_acc=0.982, eval_loss=4.74, eval_precision=0.831, eval_recall=0.865]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.83      0.87      0.85      2857
          NT       0.75      0.79      0.77      1314

   micro avg       0.84      0.87      0.85      5587
   macro avg       0.84      0.87      0.85      5587
weighted avg       0.84      0.87      0.86      5587



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.41it/s, F1=0.983, train_acc=0.999, train_loss=0.433, train_precision=0.979, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.97      0.99      0.98       821
          NT       0.97      0.99      0.98       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.99      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.839, eval_acc=0.981, eval_loss=4.99, eval_precision=0.814, eval_recall=0.869]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.79      0.86      0.83      2857
          NT       0.74      0.79      0.76      1314

   micro avg       0.81      0.87      0.84      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.967, train_acc=0.998, train_loss=0.868, train_precision=0.957, train_recall=0.978]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98       375
          NS       0.98      0.99      0.98       821
          NT       0.92      0.96      0.94       432

   micro avg       0.96      0.98      0.97      1628
   macro avg       0.96      0.98      0.97      1628
weighted avg       0.96      0.98      0.97      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.826, eval_acc=0.978, eval_loss=4.83, eval_precision=0.813, eval_recall=0.843]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.79      0.86      0.82      2857
          NT       0.69      0.66      0.67      1314

   micro avg       0.80      0.84      0.82      5587
   macro avg       0.80      0.83      0.81      5587
weighted avg       0.80      0.84      0.82      5587



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.975, train_acc=0.998, train_loss=0.477, train_precision=0.969, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       375
          NS       0.98      0.99      0.98       821
          NT       0.93      0.97      0.95       432

   micro avg       0.97      0.98      0.97      1628
   macro avg       0.96      0.98      0.97      1628
weighted avg       0.97      0.98      0.97      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.813, eval_acc=0.981, eval_loss=4.06, eval_precision=0.806, eval_recall=0.825]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.91      0.89      1416
          NS       0.83      0.85      0.84      2857
          NT       0.74      0.72      0.73      1314

   micro avg       0.82      0.84      0.83      5587
   macro avg       0.81      0.83      0.82      5587
weighted avg       0.82      0.84      0.83      5587



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.99, train_acc=0.999, train_loss=0.198, train_precision=0.989, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       375
          NS       0.99      0.99      0.99       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.31it/s, F1=0.836, eval_acc=0.982, eval_loss=4.4, eval_precision=0.821, eval_recall=0.854] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.82      0.86      0.84      2857
          NT       0.73      0.76      0.74      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.83      0.86      0.84      5587
weighted avg       0.83      0.86      0.84      5587



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.992, train_acc=1, train_loss=0.112, train_precision=0.99, train_recall=0.994]     


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.97      0.99      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.20it/s, F1=0.84, eval_acc=0.982, eval_loss=4.68, eval_precision=0.823, eval_recall=0.861] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.81      0.86      0.84      2857
          NT       0.71      0.79      0.75      1314

   micro avg       0.82      0.87      0.84      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.82      0.87      0.84      5587



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.41it/s, F1=0.986, train_acc=0.999, train_loss=0.266, train_precision=0.983, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      0.99      0.99       821
          NT       0.96      0.98      0.97       432

   micro avg       0.98      0.99      0.99      1628
   macro avg       0.98      0.99      0.98      1628
weighted avg       0.98      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.851, eval_acc=0.983, eval_loss=4.9, eval_precision=0.847, eval_recall=0.858] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.84      0.87      0.85      2857
          NT       0.76      0.77      0.77      1314

   micro avg       0.85      0.86      0.86      5587
   macro avg       0.85      0.86      0.86      5587
weighted avg       0.85      0.86      0.86      5587



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.99, train_acc=0.999, train_loss=0.15, train_precision=0.989, train_recall=0.992]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      0.99      0.99       821
          NT       0.98      0.99      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.861, eval_acc=0.984, eval_loss=4.46, eval_precision=0.863, eval_recall=0.862]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.87      0.87      0.87      2857
          NT       0.76      0.79      0.78      1314

   micro avg       0.86      0.87      0.87      5587
   macro avg       0.86      0.87      0.86      5587
weighted avg       0.87      0.87      0.87      5587



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.48it/s, F1=0.995, train_acc=1, train_loss=0.0941, train_precision=0.995, train_recall=0.997]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      0.99       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       0.99      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.853, eval_acc=0.983, eval_loss=4.9, eval_precision=0.84, eval_recall=0.871]  


eval_reports:
              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.81      0.89      0.85      2857
          NT       0.78      0.75      0.76      1314

   micro avg       0.84      0.87      0.86      5587
   macro avg       0.85      0.86      0.85      5587
weighted avg       0.84      0.87      0.85      5587



calculate data/few_shot/msra/train_1000.json etag: 100%|██████████| 597k/597k [00:00<00:00, 296MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 335MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 368MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 105kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_1000.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_1000_x2"
}
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 113578.83L/s]
build line mapper: 14L [00:00, 114241.74L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 3958.22it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 154464.45it/s]
load dataset from data/few_shot/msra/train_1000.json: 0it [00:00, ?it/s]

load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_1000.json: 1000it [00:01, 585.82it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 666.26it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model f

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.00396, train_acc=0.738, train_loss=59.4, train_precision=0.00394, train_recall=0.00888]


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.00      0.00       375
          NS       0.00      0.02      0.01       821
          NT       0.00      0.01      0.00       432

   micro avg       0.00      0.01      0.00      1628
   macro avg       0.00      0.01      0.00      1628
weighted avg       0.00      0.01      0.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.0312, eval_acc=0.914, eval_loss=12.5, eval_precision=0.0219, eval_recall=0.0554]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.00      0.00      0.00      1416
          NS       0.04      0.07      0.05      2857
          NT       0.02      0.13      0.04      1314

   micro avg       0.02      0.06      0.04      5587
   macro avg       0.02      0.07      0.03      5587
weighted avg       0.03      0.06      0.03      5587



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.533, train_acc=0.964, train_loss=6.76, train_precision=0.494, train_recall=0.59]   


train_reports:
              precision    recall  f1-score   support

          NR       0.66      0.75      0.70       375
          NS       0.44      0.55      0.49       821
          NT       0.32      0.54      0.40       432

   micro avg       0.44      0.60      0.51      1628
   macro avg       0.47      0.62      0.53      1628
weighted avg       0.46      0.60      0.51      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.771, eval_acc=0.976, eval_loss=4.32, eval_precision=0.741, eval_recall=0.816]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.76      0.80      0.78      2857
          NT       0.51      0.68      0.58      1314

   micro avg       0.73      0.81      0.77      5587
   macro avg       0.74      0.81      0.77      5587
weighted avg       0.75      0.81      0.77      5587



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.857, train_acc=0.99, train_loss=2.05, train_precision=0.842, train_recall=0.88]  


train_reports:
              precision    recall  f1-score   support

          NR       0.93      0.93      0.93       375
          NS       0.84      0.89      0.87       821
          NT       0.76      0.82      0.79       432

   micro avg       0.84      0.88      0.86      1628
   macro avg       0.84      0.88      0.86      1628
weighted avg       0.84      0.88      0.86      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.798, eval_acc=0.979, eval_loss=3.77, eval_precision=0.749, eval_recall=0.861]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.96      0.95      1416
          NS       0.78      0.83      0.80      2857
          NT       0.57      0.82      0.68      1314

   micro avg       0.75      0.86      0.80      5587
   macro avg       0.76      0.87      0.81      5587
weighted avg       0.77      0.86      0.81      5587



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.926, train_acc=0.995, train_loss=0.864, train_precision=0.914, train_recall=0.943]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.97      0.97       375
          NS       0.92      0.96      0.94       821
          NT       0.88      0.91      0.89       432

   micro avg       0.92      0.95      0.93      1628
   macro avg       0.92      0.95      0.93      1628
weighted avg       0.92      0.95      0.93      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.84, eval_acc=0.983, eval_loss=4.55, eval_precision=0.842, eval_recall=0.841] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.83      0.85      0.84      2857
          NT       0.74      0.70      0.72      1314

   micro avg       0.84      0.84      0.84      5587
   macro avg       0.83      0.83      0.83      5587
weighted avg       0.83      0.84      0.84      5587



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.955, train_acc=0.997, train_loss=0.569, train_precision=0.954, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.98      0.98       375
          NS       0.96      0.97      0.96       821
          NT       0.94      0.96      0.95       432

   micro avg       0.96      0.97      0.96      1628
   macro avg       0.96      0.97      0.97      1628
weighted avg       0.96      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.818, eval_acc=0.982, eval_loss=3.94, eval_precision=0.774, eval_recall=0.876]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.77      0.88      0.82      2857
          NT       0.68      0.81      0.74      1314

   micro avg       0.79      0.88      0.83      5587
   macro avg       0.79      0.88      0.83      5587
weighted avg       0.79      0.88      0.83      5587



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.954, train_acc=0.997, train_loss=0.711, train_precision=0.947, train_recall=0.962]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.97       375
          NS       0.97      0.98      0.98       821
          NT       0.88      0.93      0.91       432

   micro avg       0.95      0.97      0.96      1628
   macro avg       0.94      0.96      0.95      1628
weighted avg       0.95      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.827, eval_acc=0.981, eval_loss=4.2, eval_precision=0.797, eval_recall=0.865] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.79      0.88      0.84      2857
          NT       0.71      0.74      0.72      1314

   micro avg       0.80      0.87      0.84      5587
   macro avg       0.81      0.86      0.83      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.956, train_acc=0.997, train_loss=0.626, train_precision=0.949, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.97      0.97       375
          NS       0.97      0.98      0.97       821
          NT       0.91      0.95      0.93       432

   micro avg       0.95      0.97      0.96      1628
   macro avg       0.95      0.97      0.96      1628
weighted avg       0.95      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.832, eval_acc=0.984, eval_loss=3.81, eval_precision=0.81, eval_recall=0.861] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.82      0.87      0.84      2857
          NT       0.67      0.74      0.70      1314

   micro avg       0.81      0.86      0.83      5587
   macro avg       0.81      0.85      0.83      5587
weighted avg       0.81      0.86      0.84      5587



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.979, train_acc=0.999, train_loss=0.203, train_precision=0.975, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98       375
          NS       0.99      0.99      0.99       821
          NT       0.96      0.97      0.97       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.98      0.98      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.84, eval_acc=0.983, eval_loss=4.07, eval_precision=0.811, eval_recall=0.878] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.83      0.88      0.85      2857
          NT       0.68      0.81      0.74      1314

   micro avg       0.82      0.88      0.85      5587
   macro avg       0.82      0.88      0.85      5587
weighted avg       0.82      0.88      0.85      5587



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.989, train_acc=0.999, train_loss=0.113, train_precision=0.987, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      0.99      0.99       821
          NT       0.97      0.99      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.859, eval_acc=0.985, eval_loss=4.54, eval_precision=0.842, eval_recall=0.881]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.84      0.89      0.86      2857
          NT       0.77      0.78      0.77      1314

   micro avg       0.85      0.88      0.86      5587
   macro avg       0.85      0.88      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.973, train_acc=0.998, train_loss=0.475, train_precision=0.967, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.91      0.95      0.93       432

   micro avg       0.96      0.98      0.97      1628
   macro avg       0.96      0.98      0.97      1628
weighted avg       0.96      0.98      0.97      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.844, eval_acc=0.982, eval_loss=4.59, eval_precision=0.841, eval_recall=0.849]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.87      0.85      0.86      2857
          NT       0.67      0.72      0.70      1314

   micro avg       0.84      0.85      0.84      5587
   macro avg       0.83      0.84      0.84      5587
weighted avg       0.84      0.85      0.84      5587



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:40<00:00,  3.11it/s, F1=0.991, train_acc=0.999, train_loss=0.194, train_precision=0.989, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      0.99      0.99       821
          NT       0.97      0.98      0.97       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.859, eval_acc=0.984, eval_loss=4.78, eval_precision=0.844, eval_recall=0.877]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.86      0.88      0.87      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.85      0.88      0.86      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.997, train_acc=1, train_loss=0.109, train_precision=0.997, train_recall=0.997]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      0.99      0.99       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.859, eval_acc=0.984, eval_loss=4.91, eval_precision=0.856, eval_recall=0.865]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.85      0.87      0.86      2857
          NT       0.76      0.75      0.76      1314

   micro avg       0.86      0.87      0.86      5587
   macro avg       0.86      0.86      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.992, train_acc=0.999, train_loss=0.134, train_precision=0.989, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      1.00      0.99       821
          NT       0.98      0.99      0.98       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.865, eval_acc=0.985, eval_loss=4.43, eval_precision=0.848, eval_recall=0.886]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.86      0.90      0.88      2857
          NT       0.74      0.79      0.77      1314

   micro avg       0.85      0.89      0.87      5587
   macro avg       0.85      0.88      0.87      5587
weighted avg       0.85      0.89      0.87      5587



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.997, train_acc=1, train_loss=0.0653, train_precision=0.997, train_recall=0.997]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      0.99      0.99       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.87, eval_acc=0.985, eval_loss=4.97, eval_precision=0.865, eval_recall=0.877] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.87      0.90      0.88      2857
          NT       0.77      0.75      0.76      1314

   micro avg       0.87      0.88      0.87      5587
   macro avg       0.86      0.87      0.87      5587
weighted avg       0.87      0.88      0.87      5587



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.48it/s, F1=0.997, train_acc=1, train_loss=0.0618, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.57it/s, F1=0.851, eval_acc=0.984, eval_loss=4.22, eval_precision=0.822, eval_recall=0.887]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.85      0.89      0.87      2857
          NT       0.68      0.83      0.74      1314

   micro avg       0.83      0.89      0.86      5587
   macro avg       0.83      0.89      0.86      5587
weighted avg       0.83      0.89      0.86      5587



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.99, train_acc=1, train_loss=0.0635, train_precision=0.99, train_recall=0.99]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.23it/s, F1=0.857, eval_acc=0.985, eval_loss=4.59, eval_precision=0.834, eval_recall=0.886]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.95      1416
          NS       0.83      0.90      0.87      2857
          NT       0.72      0.79      0.75      1314

   micro avg       0.83      0.89      0.86      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.84      0.89      0.86      5587



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.40it/s, F1=0.999, train_acc=1, train_loss=0.0332, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.868, eval_acc=0.985, eval_loss=4.36, eval_precision=0.856, eval_recall=0.883]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.85      0.89      0.87      2857
          NT       0.77      0.79      0.78      1314

   micro avg       0.86      0.89      0.87      5587
   macro avg       0.86      0.88      0.87      5587
weighted avg       0.86      0.89      0.87      5587



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.978, train_acc=0.999, train_loss=0.449, train_precision=0.973, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.98      0.98       821
          NT       0.94      0.97      0.95       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.97      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.836, eval_acc=0.983, eval_loss=4.49, eval_precision=0.817, eval_recall=0.862]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.83      0.86      0.84      2857
          NT       0.68      0.80      0.74      1314

   micro avg       0.82      0.87      0.84      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.82      0.87      0.84      5587



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.974, train_acc=0.998, train_loss=0.415, train_precision=0.97, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       375
          NS       0.98      0.99      0.98       821
          NT       0.93      0.96      0.94       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.97      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.801, eval_acc=0.978, eval_loss=7.45, eval_precision=0.81, eval_recall=0.796] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.77      0.80      0.79      2857
          NT       0.70      0.63      0.66      1314

   micro avg       0.80      0.80      0.80      5587
   macro avg       0.80      0.79      0.80      5587
weighted avg       0.80      0.80      0.80      5587



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.986, train_acc=0.999, train_loss=0.238, train_precision=0.983, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.98      0.99      0.98       821
          NT       0.97      0.98      0.97       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.99      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.847, eval_acc=0.984, eval_loss=4.72, eval_precision=0.84, eval_recall=0.857] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.82      0.88      0.85      2857
          NT       0.72      0.71      0.72      1314

   micro avg       0.83      0.86      0.84      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.83      0.86      0.84      5587



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.966, train_acc=0.998, train_loss=0.6, train_precision=0.959, train_recall=0.974]  


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.97      0.99      0.98       821
          NT       0.94      0.97      0.95       432

   micro avg       0.97      0.98      0.97      1628
   macro avg       0.97      0.98      0.97      1628
weighted avg       0.97      0.98      0.97      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.834, eval_acc=0.982, eval_loss=4.57, eval_precision=0.799, eval_recall=0.881]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.81      0.89      0.85      2857
          NT       0.70      0.79      0.74      1314

   micro avg       0.81      0.88      0.84      5587
   macro avg       0.81      0.88      0.84      5587
weighted avg       0.81      0.88      0.84      5587



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.979, train_acc=0.998, train_loss=0.418, train_precision=0.974, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.97      0.99      0.98       821
          NT       0.96      0.97      0.97       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.838, eval_acc=0.982, eval_loss=4.47, eval_precision=0.819, eval_recall=0.864]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.81      0.86      0.84      2857
          NT       0.74      0.78      0.76      1314

   micro avg       0.82      0.87      0.85      5587
   macro avg       0.83      0.87      0.85      5587
weighted avg       0.82      0.87      0.85      5587



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.15it/s, F1=0.968, train_acc=0.997, train_loss=0.632, train_precision=0.961, train_recall=0.977]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.98       375
          NS       0.97      0.99      0.98       821
          NT       0.93      0.95      0.94       432

   micro avg       0.96      0.98      0.97      1628
   macro avg       0.96      0.97      0.97      1628
weighted avg       0.96      0.98      0.97      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.19it/s, F1=0.834, eval_acc=0.982, eval_loss=4.57, eval_precision=0.802, eval_recall=0.875]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.80      0.90      0.85      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.82      0.88      0.85      5587
   macro avg       0.82      0.87      0.85      5587
weighted avg       0.82      0.88      0.85      5587



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.985, train_acc=0.999, train_loss=0.34, train_precision=0.979, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       375
          NS       0.97      0.99      0.98       821
          NT       0.98      0.99      0.98       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.98      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.856, eval_acc=0.983, eval_loss=4.79, eval_precision=0.846, eval_recall=0.873]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.86      0.88      0.87      2857
          NT       0.75      0.79      0.77      1314

   micro avg       0.85      0.88      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.13it/s, F1=0.998, train_acc=1, train_loss=0.0347, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.859, eval_acc=0.983, eval_loss=5.03, eval_precision=0.845, eval_recall=0.878]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.85      0.88      0.87      2857
          NT       0.76      0.80      0.78      1314

   micro avg       0.85      0.88      0.87      5587
   macro avg       0.85      0.88      0.86      5587
weighted avg       0.85      0.88      0.87      5587



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.50it/s, F1=0.998, train_acc=1, train_loss=0.0249, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      0.99       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.844, eval_acc=0.982, eval_loss=5.64, eval_precision=0.833, eval_recall=0.86] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.93      0.90      1416
          NS       0.85      0.86      0.86      2857
          NT       0.76      0.79      0.78      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.83      0.86      0.85      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.995, train_acc=1, train_loss=0.0369, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       0.99      1.00      1.00      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.851, eval_acc=0.982, eval_loss=5.59, eval_precision=0.839, eval_recall=0.868]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.92      0.94      1416
          NS       0.85      0.89      0.87      2857
          NT       0.74      0.79      0.76      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.15it/s, F1=0.985, train_acc=1, train_loss=0.128, train_precision=0.984, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.98      0.99      0.99       432

   micro avg       0.99      1.00      1.00      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.863, eval_acc=0.983, eval_loss=5.3, eval_precision=0.846, eval_recall=0.884] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.86      0.89      0.87      2857
          NT       0.75      0.81      0.78      1314

   micro avg       0.85      0.89      0.87      5587
   macro avg       0.85      0.88      0.86      5587
weighted avg       0.85      0.89      0.87      5587



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.996, train_acc=1, train_loss=0.0422, train_precision=0.995, train_recall=0.997]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      0.99       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.866, eval_acc=0.984, eval_loss=5.46, eval_precision=0.862, eval_recall=0.874]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.86      0.88      0.87      2857
          NT       0.78      0.80      0.79      1314

   micro avg       0.86      0.88      0.87      5587
   macro avg       0.86      0.87      0.87      5587
weighted avg       0.86      0.88      0.87      5587



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.17it/s, F1=0.998, train_acc=1, train_loss=0.0348, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      1.00      0.99       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.86, eval_acc=0.984, eval_loss=5.73, eval_precision=0.861, eval_recall=0.862] 


eval_reports:
              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.86      0.88      0.87      2857
          NT       0.79      0.75      0.77      1314

   micro avg       0.86      0.87      0.86      5587
   macro avg       0.86      0.86      0.86      5587
weighted avg       0.86      0.87      0.86      5587



calculate data/few_shot/msra/train_1000.json etag: 100%|██████████| 597k/597k [00:00<00:00, 298MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 334MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 369MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 114kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_1000.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_1000_x3"
}
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 100893.91L/s]
build line mapper: 14L [00:00, 119108.02L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4869.01it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 163741.60it/s]
load dataset from data/few_shot/msra/train_1000.json: 0it [00:00, ?it/s]

load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/cd9a43ce51176d6be9ddcff512797086_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_1000.json: 1000it [00:01, 585.80it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 670.53it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model f

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.0095, train_acc=0.777, train_loss=48.3, train_precision=0.00762, train_recall=0.0153]    


train_reports:
              precision    recall  f1-score   support

          NR       0.00      0.01      0.00       375
          NS       0.01      0.02      0.02       821
          NT       0.01      0.02      0.01       432

   micro avg       0.00      0.02      0.01      1628
   macro avg       0.01      0.02      0.01      1628
weighted avg       0.01      0.02      0.01      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.074, eval_acc=0.931, eval_loss=9.83, eval_precision=0.059, eval_recall=0.101]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.02      0.03      0.02      1416
          NS       0.05      0.08      0.06      2857
          NT       0.15      0.29      0.19      1314

   micro avg       0.07      0.12      0.09      5587
   macro avg       0.07      0.14      0.09      5587
weighted avg       0.06      0.12      0.08      5587



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.567, train_acc=0.968, train_loss=5.77, train_precision=0.537, train_recall=0.617]


train_reports:
              precision    recall  f1-score   support

          NR       0.43      0.58      0.49       375
          NS       0.54      0.69      0.60       821
          NT       0.45      0.57      0.51       432

   micro avg       0.49      0.63      0.55      1628
   macro avg       0.47      0.61      0.53      1628
weighted avg       0.49      0.63      0.55      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.767, eval_acc=0.979, eval_loss=3.24, eval_precision=0.711, eval_recall=0.842]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.89      0.91      1416
          NS       0.73      0.86      0.79      2857
          NT       0.53      0.74      0.62      1314

   micro avg       0.71      0.84      0.77      5587
   macro avg       0.73      0.83      0.77      5587
weighted avg       0.73      0.84      0.78      5587



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.48it/s, F1=0.866, train_acc=0.99, train_loss=1.9, train_precision=0.845, train_recall=0.896] 


train_reports:
              precision    recall  f1-score   support

          NR       0.93      0.95      0.94       375
          NS       0.85      0.91      0.88       821
          NT       0.73      0.81      0.77       432

   micro avg       0.84      0.90      0.87      1628
   macro avg       0.84      0.89      0.87      1628
weighted avg       0.84      0.90      0.87      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.816, eval_acc=0.982, eval_loss=2.73, eval_precision=0.798, eval_recall=0.84] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.89      0.91      1416
          NS       0.80      0.84      0.82      2857
          NT       0.67      0.76      0.71      1314

   micro avg       0.80      0.83      0.82      5587
   macro avg       0.80      0.83      0.81      5587
weighted avg       0.80      0.83      0.82      5587



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.921, train_acc=0.995, train_loss=0.906, train_precision=0.907, train_recall=0.94] 


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.97      0.96       375
          NS       0.93      0.96      0.95       821
          NT       0.84      0.89      0.87       432

   micro avg       0.91      0.95      0.93      1628
   macro avg       0.91      0.94      0.93      1628
weighted avg       0.91      0.95      0.93      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.823, eval_acc=0.981, eval_loss=3.17, eval_precision=0.791, eval_recall=0.863]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.89      0.92      1416
          NS       0.81      0.88      0.84      2857
          NT       0.69      0.81      0.74      1314

   micro avg       0.81      0.87      0.83      5587
   macro avg       0.81      0.86      0.83      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.96, train_acc=0.997, train_loss=0.477, train_precision=0.954, train_recall=0.967] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       375
          NS       0.97      0.98      0.97       821
          NT       0.91      0.95      0.93       432

   micro avg       0.95      0.97      0.96      1628
   macro avg       0.95      0.97      0.96      1628
weighted avg       0.96      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.828, eval_acc=0.982, eval_loss=3.66, eval_precision=0.805, eval_recall=0.857]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.91      0.91      1416
          NS       0.80      0.85      0.83      2857
          NT       0.73      0.78      0.76      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.81      0.85      0.83      5587
weighted avg       0.81      0.85      0.83      5587



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.18it/s, F1=0.981, train_acc=0.999, train_loss=0.245, train_precision=0.978, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.98      0.98       821
          NT       0.95      0.97      0.96       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.835, eval_acc=0.982, eval_loss=3.49, eval_precision=0.809, eval_recall=0.866]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.90      0.91      1416
          NS       0.82      0.89      0.85      2857
          NT       0.72      0.81      0.76      1314

   micro avg       0.82      0.87      0.85      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.87      0.85      5587



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.48it/s, F1=0.976, train_acc=0.998, train_loss=0.333, train_precision=0.971, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98       375
          NS       0.98      0.99      0.98       821
          NT       0.94      0.97      0.96       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.97      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.819, eval_acc=0.982, eval_loss=4.04, eval_precision=0.811, eval_recall=0.832]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.81      0.88      0.85      2857
          NT       0.71      0.68      0.70      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.83      0.83      5587
weighted avg       0.82      0.85      0.83      5587



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.977, train_acc=0.999, train_loss=0.33, train_precision=0.971, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.99      0.98       375
          NS       0.97      0.98      0.98       821
          NT       0.95      0.97      0.96       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.97      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.59it/s, F1=0.838, eval_acc=0.983, eval_loss=4.28, eval_precision=0.839, eval_recall=0.841]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.92      0.94      1416
          NS       0.83      0.88      0.85      2857
          NT       0.72      0.69      0.70      1314

   micro avg       0.84      0.84      0.84      5587
   macro avg       0.84      0.83      0.83      5587
weighted avg       0.84      0.84      0.84      5587



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.981, train_acc=0.999, train_loss=0.273, train_precision=0.976, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.97      0.98      0.97       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.98      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.832, eval_acc=0.982, eval_loss=4.01, eval_precision=0.823, eval_recall=0.846]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.92      0.93      1416
          NS       0.84      0.84      0.84      2857
          NT       0.71      0.79      0.75      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.47it/s, F1=0.965, train_acc=0.997, train_loss=0.535, train_precision=0.958, train_recall=0.973]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.98       375
          NS       0.96      0.98      0.97       821
          NT       0.92      0.95      0.94       432

   micro avg       0.95      0.97      0.96      1628
   macro avg       0.95      0.97      0.96      1628
weighted avg       0.95      0.97      0.96      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.832, eval_acc=0.982, eval_loss=3.88, eval_precision=0.83, eval_recall=0.838] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.92      0.93      1416
          NS       0.81      0.85      0.83      2857
          NT       0.77      0.73      0.75      1314

   micro avg       0.83      0.84      0.84      5587
   macro avg       0.84      0.83      0.84      5587
weighted avg       0.83      0.84      0.84      5587



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.17it/s, F1=0.981, train_acc=0.998, train_loss=0.342, train_precision=0.978, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.96      0.97      0.96       432

   micro avg       0.98      0.98      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.98      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.842, eval_acc=0.982, eval_loss=4.01, eval_precision=0.834, eval_recall=0.854]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.92      0.93      1416
          NS       0.83      0.85      0.84      2857
          NT       0.72      0.77      0.75      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.995, train_acc=1, train_loss=0.0854, train_precision=0.993, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.98      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.856, eval_acc=0.983, eval_loss=4.45, eval_precision=0.85, eval_recall=0.866] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.84      0.88      0.86      2857
          NT       0.77      0.75      0.76      1314

   micro avg       0.85      0.86      0.86      5587
   macro avg       0.85      0.86      0.85      5587
weighted avg       0.85      0.86      0.86      5587



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.22it/s, F1=0.994, train_acc=0.999, train_loss=0.124, train_precision=0.993, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      1.00      0.99       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.835, eval_acc=0.981, eval_loss=4.34, eval_precision=0.814, eval_recall=0.862]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.94      1416
          NS       0.82      0.85      0.84      2857
          NT       0.71      0.80      0.75      1314

   micro avg       0.82      0.86      0.84      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.86      0.84      5587



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.49it/s, F1=0.987, train_acc=0.999, train_loss=0.219, train_precision=0.986, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.98      0.99      0.99       432

   micro avg       0.98      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.98      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.86, eval_acc=0.984, eval_loss=4.28, eval_precision=0.861, eval_recall=0.863] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.85      0.87      0.86      2857
          NT       0.80      0.76      0.78      1314

   micro avg       0.87      0.86      0.86      5587
   macro avg       0.87      0.86      0.86      5587
weighted avg       0.87      0.86      0.86      5587



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.999, train_acc=1, train_loss=0.0335, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.56it/s, F1=0.865, eval_acc=0.985, eval_loss=4.14, eval_precision=0.862, eval_recall=0.871]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.86      0.88      0.87      2857
          NT       0.79      0.79      0.79      1314

   micro avg       0.87      0.87      0.87      5587
   macro avg       0.87      0.87      0.87      5587
weighted avg       0.87      0.87      0.87      5587



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.994, train_acc=1, train_loss=0.0411, train_precision=0.992, train_recall=0.996]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      1.00      1.00       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      1.00      1628
   macro avg       0.99      1.00      1.00      1628
weighted avg       0.99      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.859, eval_acc=0.985, eval_loss=4.1, eval_precision=0.858, eval_recall=0.864] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.87      0.87      0.87      2857
          NT       0.76      0.79      0.78      1314

   micro avg       0.86      0.87      0.87      5587
   macro avg       0.86      0.87      0.86      5587
weighted avg       0.86      0.87      0.87      5587



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.52it/s, F1=0.992, train_acc=0.999, train_loss=0.222, train_precision=0.988, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       375
          NS       1.00      1.00      1.00       821
          NT       0.97      0.99      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.83, eval_acc=0.982, eval_loss=5.35, eval_precision=0.86, eval_recall=0.808]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.87      0.81      0.83      2857
          NT       0.79      0.76      0.77      1314

   micro avg       0.87      0.83      0.85      5587
   macro avg       0.87      0.83      0.85      5587
weighted avg       0.87      0.83      0.85      5587



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.20it/s, F1=0.983, train_acc=0.998, train_loss=0.363, train_precision=0.98, train_recall=0.987] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       375
          NS       0.99      0.99      0.99       821
          NT       0.96      0.98      0.97       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.98      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.827, eval_acc=0.982, eval_loss=4.34, eval_precision=0.814, eval_recall=0.846]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.95      1416
          NS       0.79      0.86      0.82      2857
          NT       0.74      0.74      0.74      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.82      0.85      0.84      5587
weighted avg       0.82      0.85      0.83      5587



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.988, train_acc=0.999, train_loss=0.183, train_precision=0.988, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      0.99      0.99       821
          NT       0.98      0.99      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.849, eval_acc=0.983, eval_loss=3.98, eval_precision=0.834, eval_recall=0.869]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.83      0.87      0.85      2857
          NT       0.77      0.80      0.78      1314

   micro avg       0.84      0.87      0.86      5587
   macro avg       0.84      0.87      0.86      5587
weighted avg       0.84      0.87      0.86      5587



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.99, train_acc=0.999, train_loss=0.179, train_precision=0.988, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       375
          NS       0.99      0.99      0.99       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.842, eval_acc=0.982, eval_loss=4.08, eval_precision=0.823, eval_recall=0.868]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.92      0.93      1416
          NS       0.82      0.88      0.85      2857
          NT       0.74      0.80      0.77      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.83      0.86      0.85      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.998, train_acc=1, train_loss=0.0443, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.845, eval_acc=0.982, eval_loss=4.61, eval_precision=0.835, eval_recall=0.861]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.93      0.94      1416
          NS       0.82      0.85      0.83      2857
          NT       0.75      0.81      0.78      1314

   micro avg       0.83      0.86      0.85      5587
   macro avg       0.84      0.86      0.85      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.995, train_acc=0.999, train_loss=0.133, train_precision=0.995, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      1.00      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.855, eval_acc=0.983, eval_loss=4.26, eval_precision=0.848, eval_recall=0.865]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.83      0.87      0.85      2857
          NT       0.76      0.78      0.77      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.85      0.86      0.85      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.24it/s, F1=0.993, train_acc=0.999, train_loss=0.152, train_precision=0.992, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       0.99      1.00      0.99       821
          NT       0.98      0.98      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.856, eval_acc=0.982, eval_loss=5.11, eval_precision=0.859, eval_recall=0.857]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.97      0.94      0.95      1416
          NS       0.83      0.87      0.85      2857
          NT       0.81      0.73      0.77      1314

   micro avg       0.86      0.85      0.86      5587
   macro avg       0.87      0.85      0.86      5587
weighted avg       0.86      0.85      0.86      5587



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=0.977, train_acc=0.998, train_loss=0.472, train_precision=0.973, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.97      0.98      0.98       821
          NT       0.94      0.97      0.96       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.817, eval_acc=0.979, eval_loss=4.51, eval_precision=0.787, eval_recall=0.855]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.93      1416
          NS       0.75      0.89      0.81      2857
          NT       0.72      0.68      0.70      1314

   micro avg       0.78      0.85      0.82      5587
   macro avg       0.80      0.83      0.81      5587
weighted avg       0.79      0.85      0.82      5587



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.48it/s, F1=0.976, train_acc=0.998, train_loss=0.364, train_precision=0.971, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.98      0.99      0.98       821
          NT       0.95      0.97      0.96       432

   micro avg       0.97      0.98      0.98      1628
   macro avg       0.97      0.98      0.98      1628
weighted avg       0.97      0.98      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.57it/s, F1=0.856, eval_acc=0.983, eval_loss=4.26, eval_precision=0.856, eval_recall=0.859]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.93      0.94      1416
          NS       0.85      0.86      0.85      2857
          NT       0.75      0.76      0.76      1314

   micro avg       0.85      0.85      0.85      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.85      0.85      0.85      5587



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.986, train_acc=0.999, train_loss=0.404, train_precision=0.982, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.98      0.98       375
          NS       0.98      0.99      0.99       821
          NT       0.98      0.98      0.98       432

   micro avg       0.98      0.99      0.98      1628
   macro avg       0.98      0.99      0.98      1628
weighted avg       0.98      0.99      0.98      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.85, eval_acc=0.983, eval_loss=4.72, eval_precision=0.858, eval_recall=0.846] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.90      0.93      1416
          NS       0.86      0.87      0.86      2857
          NT       0.78      0.76      0.77      1314

   micro avg       0.86      0.85      0.86      5587
   macro avg       0.87      0.84      0.85      5587
weighted avg       0.87      0.85      0.86      5587



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.39it/s, F1=0.994, train_acc=1, train_loss=0.133, train_precision=0.994, train_recall=0.994]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       375
          NS       1.00      1.00      1.00       821
          NT       0.99      0.99      0.99       432

   micro avg       0.99      1.00      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      1.00      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.848, eval_acc=0.983, eval_loss=4.62, eval_precision=0.838, eval_recall=0.862]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.81      0.89      0.85      2857
          NT       0.82      0.71      0.76      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.86      0.85      0.85      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:38<00:00,  3.25it/s, F1=0.991, train_acc=0.999, train_loss=0.253, train_precision=0.99, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       0.99      1.00      0.99       821
          NT       0.99      0.98      0.98       432

   micro avg       0.99      0.99      0.99      1628
   macro avg       0.99      0.99      0.99      1628
weighted avg       0.99      0.99      0.99      1628



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.852, eval_acc=0.983, eval_loss=5.04, eval_precision=0.861, eval_recall=0.847]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.93      0.94      1416
          NS       0.83      0.87      0.85      2857
          NT       0.81      0.70      0.75      1314

   micro avg       0.86      0.84      0.85      5587
   macro avg       0.86      0.83      0.85      5587
weighted avg       0.86      0.84      0.85      5587



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.996, train_acc=1, train_loss=0.0298, train_precision=0.996, train_recall=0.996]   


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.858, eval_acc=0.984, eval_loss=4.72, eval_precision=0.858, eval_recall=0.861]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.94      1416
          NS       0.85      0.87      0.86      2857
          NT       0.79      0.75      0.77      1314

   micro avg       0.86      0.86      0.86      5587
   macro avg       0.86      0.85      0.86      5587
weighted avg       0.86      0.86      0.86      5587



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:39<00:00,  3.18it/s, F1=0.996, train_acc=1, train_loss=0.062, train_precision=0.997, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       375
          NS       1.00      1.00      1.00       821
          NT       1.00      1.00      1.00       432

   micro avg       1.00      1.00      1.00      1628
   macro avg       1.00      1.00      1.00      1628
weighted avg       1.00      1.00      1.00      1628



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.834, eval_acc=0.981, eval_loss=5.33, eval_precision=0.827, eval_recall=0.845]


eval_reports:
              precision    recall  f1-score   support

          NR       0.92      0.94      0.93      1416
          NS       0.80      0.88      0.84      2857
          NT       0.79      0.64      0.71      1314

   micro avg       0.83      0.84      0.84      5587
   macro avg       0.84      0.82      0.83      5587
weighted avg       0.83      0.84      0.83      5587



calculate data/few_shot/msra/train_1350.json etag: 100%|██████████| 808k/808k [00:00<00:00, 305MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 338MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 360MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 116kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_1350.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "msra_pretrain_lebert_crf_1350_x1"
}
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree



count line size data/few_shot/msra/labels.txt: 14L [00:00, 117440.51L/s]
build line mapper: 14L [00:00, 120328.39L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4153.95it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 161798.08it/s]

load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding



load dataset from data/few_shot/msra/train_1350.json: 1350it [00:02, 584.04it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 675.32it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.107, train_acc=0.825, train_loss=29.7, train_precision=0.0968, train_recall=0.123]       


train_reports:
              precision    recall  f1-score   support

          NR       0.02      0.11      0.04       520
          NS       0.06      0.10      0.08      1140
          NT       0.03      0.19      0.06       593

   micro avg       0.04      0.12      0.06      2253
   macro avg       0.04      0.13      0.06      2253
weighted avg       0.05      0.12      0.06      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.637, eval_acc=0.969, eval_loss=4.48, eval_precision=0.588, eval_recall=0.702]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.88      0.87      0.87      1416
          NS       0.47      0.60      0.53      2857
          NT       0.58      0.75      0.66      1314

   micro avg       0.58      0.70      0.64      5587
   macro avg       0.64      0.74      0.69      5587
weighted avg       0.60      0.70      0.65      5587



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.811, train_acc=0.982, train_loss=3.02, train_precision=0.792, train_recall=0.839]


train_reports:
              precision    recall  f1-score   support

          NR       0.92      0.92      0.92       520
          NS       0.77      0.83      0.80      1140
          NT       0.72      0.77      0.74       593

   micro avg       0.79      0.83      0.81      2253
   macro avg       0.80      0.84      0.82      2253
weighted avg       0.79      0.83      0.81      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.829, eval_acc=0.983, eval_loss=2.43, eval_precision=0.812, eval_recall=0.85] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.78      0.84      0.81      2857
          NT       0.74      0.78      0.76      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.82      0.85      0.84      5587
weighted avg       0.81      0.85      0.83      5587



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.919, train_acc=0.993, train_loss=1.15, train_precision=0.912, train_recall=0.93]  


train_reports:
              precision    recall  f1-score   support

          NR       0.95      0.96      0.95       520
          NS       0.90      0.93      0.92      1140
          NT       0.87      0.90      0.89       593

   micro avg       0.91      0.93      0.92      2253
   macro avg       0.91      0.93      0.92      2253
weighted avg       0.91      0.93      0.92      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.31it/s, F1=0.803, eval_acc=0.98, eval_loss=3.64, eval_precision=0.809, eval_recall=0.801] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.91      0.91      1416
          NS       0.78      0.80      0.79      2857
          NT       0.75      0.71      0.73      1314

   micro avg       0.80      0.81      0.81      5587
   macro avg       0.81      0.81      0.81      5587
weighted avg       0.80      0.81      0.81      5587



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.949, train_acc=0.995, train_loss=0.872, train_precision=0.941, train_recall=0.96] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       520
          NS       0.94      0.96      0.95      1140
          NT       0.90      0.93      0.91       593

   micro avg       0.94      0.96      0.95      2253
   macro avg       0.94      0.96      0.95      2253
weighted avg       0.94      0.96      0.95      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.837, eval_acc=0.982, eval_loss=2.92, eval_precision=0.837, eval_recall=0.84] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.96      0.96      1416
          NS       0.86      0.84      0.85      2857
          NT       0.71      0.76      0.73      1314

   micro avg       0.85      0.85      0.85      5587
   macro avg       0.84      0.85      0.85      5587
weighted avg       0.85      0.85      0.85      5587



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:51<00:00,  3.27it/s, F1=0.963, train_acc=0.997, train_loss=0.515, train_precision=0.961, train_recall=0.966]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.97      0.98      0.98      1140
          NT       0.92      0.93      0.93       593

   micro avg       0.96      0.97      0.97      2253
   macro avg       0.96      0.97      0.96      2253
weighted avg       0.96      0.97      0.97      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.857, eval_acc=0.985, eval_loss=2.7, eval_precision=0.849, eval_recall=0.869] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.96      0.95      1416
          NS       0.85      0.87      0.86      2857
          NT       0.76      0.78      0.77      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.98, train_acc=0.998, train_loss=0.366, train_precision=0.98, train_recall=0.981]  


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.98      0.99      0.98      1140
          NT       0.96      0.97      0.97       593

   micro avg       0.98      0.98      0.98      2253
   macro avg       0.98      0.98      0.98      2253
weighted avg       0.98      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.827, eval_acc=0.983, eval_loss=3.05, eval_precision=0.814, eval_recall=0.843]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.86      0.89      1416
          NS       0.85      0.89      0.87      2857
          NT       0.70      0.79      0.74      1314

   micro avg       0.83      0.86      0.84      5587
   macro avg       0.82      0.85      0.83      5587
weighted avg       0.83      0.86      0.84      5587



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.23it/s, F1=0.983, train_acc=0.999, train_loss=0.229, train_precision=0.981, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.98      0.98       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.98      0.98      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.857, eval_acc=0.985, eval_loss=3, eval_precision=0.839, eval_recall=0.881]   


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.86      0.90      0.88      2857
          NT       0.75      0.83      0.79      1314

   micro avg       0.86      0.89      0.87      5587
   macro avg       0.85      0.89      0.87      5587
weighted avg       0.86      0.89      0.88      5587



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.987, train_acc=0.999, train_loss=0.181, train_precision=0.985, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.852, eval_acc=0.985, eval_loss=3.04, eval_precision=0.838, eval_recall=0.872]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.93      1416
          NS       0.85      0.89      0.87      2857
          NT       0.77      0.82      0.80      1314

   micro avg       0.85      0.88      0.87      5587
   macro avg       0.85      0.88      0.87      5587
weighted avg       0.86      0.88      0.87      5587



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.983, train_acc=0.999, train_loss=0.29, train_precision=0.978, train_recall=0.988] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.96      0.98      0.97       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.98      0.99      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.845, eval_acc=0.983, eval_loss=2.98, eval_precision=0.83, eval_recall=0.864] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.93      0.95      1416
          NS       0.82      0.88      0.85      2857
          NT       0.74      0.77      0.76      1314

   micro avg       0.84      0.87      0.85      5587
   macro avg       0.84      0.86      0.85      5587
weighted avg       0.84      0.87      0.85      5587



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.988, train_acc=0.999, train_loss=0.19, train_precision=0.986, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.97      0.97       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.98      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.856, eval_acc=0.984, eval_loss=3.34, eval_precision=0.87, eval_recall=0.846] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.93      0.94      1416
          NS       0.87      0.86      0.87      2857
          NT       0.81      0.76      0.78      1314

   micro avg       0.88      0.85      0.87      5587
   macro avg       0.88      0.85      0.86      5587
weighted avg       0.88      0.85      0.87      5587



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.985, train_acc=0.999, train_loss=0.244, train_precision=0.984, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       520
          NS       0.98      0.99      0.99      1140
          NT       0.97      0.97      0.97       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.98      0.98      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.836, eval_acc=0.983, eval_loss=3.36, eval_precision=0.806, eval_recall=0.874]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.94      0.93      1416
          NS       0.79      0.90      0.84      2857
          NT       0.79      0.80      0.80      1314

   micro avg       0.82      0.89      0.85      5587
   macro avg       0.83      0.88      0.85      5587
weighted avg       0.82      0.89      0.85      5587



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.48it/s, F1=0.979, train_acc=0.998, train_loss=0.35, train_precision=0.977, train_recall=0.982] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       520
          NS       0.97      0.98      0.98      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.828, eval_acc=0.983, eval_loss=3.11, eval_precision=0.811, eval_recall=0.85] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.95      0.93      1416
          NS       0.79      0.87      0.83      2857
          NT       0.75      0.70      0.72      1314

   micro avg       0.81      0.85      0.83      5587
   macro avg       0.82      0.84      0.83      5587
weighted avg       0.81      0.85      0.83      5587



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.992, train_acc=0.999, train_loss=0.127, train_precision=0.991, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       0.99      1.00      1.00      1140
          NT       0.98      0.98      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.878, eval_acc=0.986, eval_loss=3.14, eval_precision=0.877, eval_recall=0.882]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.96      0.96      1416
          NS       0.87      0.90      0.89      2857
          NT       0.82      0.78      0.80      1314

   micro avg       0.88      0.89      0.88      5587
   macro avg       0.88      0.88      0.88      5587
weighted avg       0.88      0.89      0.88      5587



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.991, train_acc=0.999, train_loss=0.143, train_precision=0.991, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.53it/s, F1=0.859, eval_acc=0.984, eval_loss=3.51, eval_precision=0.846, eval_recall=0.877]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.85      0.87      0.86      2857
          NT       0.75      0.83      0.79      1314

   micro avg       0.85      0.88      0.86      5587
   macro avg       0.85      0.88      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.998, train_acc=1, train_loss=0.0381, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.872, eval_acc=0.985, eval_loss=3.71, eval_precision=0.874, eval_recall=0.874]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.88      0.87      0.88      2857
          NT       0.80      0.79      0.79      1314

   micro avg       0.88      0.88      0.88      5587
   macro avg       0.87      0.87      0.87      5587
weighted avg       0.88      0.88      0.88      5587



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.997, train_acc=1, train_loss=0.0622, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      1.00      0.99      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.867, eval_acc=0.985, eval_loss=3.73, eval_precision=0.855, eval_recall=0.883]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.85      0.90      0.87      2857
          NT       0.80      0.81      0.80      1314

   micro avg       0.86      0.89      0.88      5587
   macro avg       0.87      0.89      0.88      5587
weighted avg       0.86      0.89      0.88      5587



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.992, train_acc=1, train_loss=0.0978, train_precision=0.989, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      1.00      0.99      1140
          NT       0.99      1.00      1.00       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.852, eval_acc=0.984, eval_loss=3.92, eval_precision=0.858, eval_recall=0.85] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.96      0.95      1416
          NS       0.84      0.86      0.85      2857
          NT       0.82      0.73      0.77      1314

   micro avg       0.86      0.86      0.86      5587
   macro avg       0.86      0.85      0.86      5587
weighted avg       0.86      0.86      0.86      5587



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.977, train_acc=0.998, train_loss=0.429, train_precision=0.972, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.98      0.99      0.98      1140
          NT       0.96      0.98      0.97       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.98      0.99      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.61it/s, F1=0.83, eval_acc=0.981, eval_loss=4.19, eval_precision=0.811, eval_recall=0.855] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.92      0.93      1416
          NS       0.83      0.87      0.85      2857
          NT       0.73      0.82      0.77      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.84      0.87      0.85      5587
weighted avg       0.84      0.87      0.85      5587



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.45it/s, F1=0.984, train_acc=0.998, train_loss=0.35, train_precision=0.981, train_recall=0.988] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.94      0.97      0.96       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.98      0.99      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.862, eval_acc=0.984, eval_loss=3.52, eval_precision=0.856, eval_recall=0.873]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.94      0.93      1416
          NS       0.86      0.88      0.87      2857
          NT       0.82      0.80      0.81      1314

   micro avg       0.87      0.88      0.87      5587
   macro avg       0.87      0.87      0.87      5587
weighted avg       0.86      0.88      0.87      5587



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.986, train_acc=0.999, train_loss=0.172, train_precision=0.983, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.98      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.70it/s, F1=0.845, eval_acc=0.983, eval_loss=3.63, eval_precision=0.842, eval_recall=0.853]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.90      0.91      1416
          NS       0.84      0.89      0.86      2857
          NT       0.86      0.74      0.79      1314

   micro avg       0.86      0.86      0.86      5587
   macro avg       0.87      0.84      0.86      5587
weighted avg       0.86      0.86      0.86      5587



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.994, train_acc=1, train_loss=0.153, train_precision=0.995, train_recall=0.994]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       1.00      1.00      1.00       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.854, eval_acc=0.984, eval_loss=3.48, eval_precision=0.855, eval_recall=0.855]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.92      0.92      1416
          NS       0.86      0.88      0.87      2857
          NT       0.83      0.80      0.82      1314

   micro avg       0.87      0.87      0.87      5587
   macro avg       0.88      0.87      0.87      5587
weighted avg       0.87      0.87      0.87      5587



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:51<00:00,  3.25it/s, F1=0.998, train_acc=1, train_loss=0.0964, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.99      1.00      0.99       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.37it/s, F1=0.859, eval_acc=0.984, eval_loss=4.03, eval_precision=0.873, eval_recall=0.848]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.86      0.87      0.86      2857
          NT       0.85      0.76      0.80      1314

   micro avg       0.88      0.86      0.87      5587
   macro avg       0.89      0.85      0.87      5587
weighted avg       0.88      0.86      0.87      5587



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.99, train_acc=0.999, train_loss=0.16, train_precision=0.989, train_recall=0.992]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.852, eval_acc=0.984, eval_loss=3.46, eval_precision=0.857, eval_recall=0.85] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.93      0.94      1416
          NS       0.86      0.87      0.86      2857
          NT       0.81      0.78      0.80      1314

   micro avg       0.87      0.86      0.87      5587
   macro avg       0.88      0.86      0.87      5587
weighted avg       0.87      0.86      0.87      5587



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.995, train_acc=1, train_loss=0.107, train_precision=0.994, train_recall=0.995]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       1.00      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.31it/s, F1=0.86, eval_acc=0.983, eval_loss=3.73, eval_precision=0.836, eval_recall=0.889] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.96      0.95      1416
          NS       0.85      0.90      0.88      2857
          NT       0.77      0.83      0.80      1314

   micro avg       0.85      0.90      0.88      5587
   macro avg       0.85      0.90      0.87      5587
weighted avg       0.85      0.90      0.88      5587



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.993, train_acc=0.999, train_loss=0.173, train_precision=0.992, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.871, eval_acc=0.984, eval_loss=3.66, eval_precision=0.865, eval_recall=0.879]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.88      0.90      0.89      2857
          NT       0.78      0.78      0.78      1314

   micro avg       0.87      0.88      0.88      5587
   macro avg       0.86      0.88      0.87      5587
weighted avg       0.87      0.88      0.88      5587



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.988, train_acc=0.998, train_loss=0.361, train_precision=0.986, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.821, eval_acc=0.978, eval_loss=3.8, eval_precision=0.807, eval_recall=0.839] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.96      0.94      1416
          NS       0.84      0.81      0.82      2857
          NT       0.68      0.83      0.74      1314

   micro avg       0.82      0.85      0.83      5587
   macro avg       0.82      0.86      0.84      5587
weighted avg       0.82      0.85      0.84      5587



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.988, train_acc=0.999, train_loss=0.277, train_precision=0.985, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       0.98      0.99      0.99      1140
          NT       0.98      0.99      0.98       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.98      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.839, eval_acc=0.984, eval_loss=3.21, eval_precision=0.832, eval_recall=0.85] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.89      0.91      1416
          NS       0.83      0.88      0.85      2857
          NT       0.80      0.79      0.80      1314

   micro avg       0.85      0.86      0.85      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.85      0.86      0.85      5587



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.994, train_acc=1, train_loss=0.0758, train_precision=0.992, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       1.00      1.00      1.00       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      1.00      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.87, eval_acc=0.984, eval_loss=3.43, eval_precision=0.862, eval_recall=0.882] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.89      0.89      0.89      2857
          NT       0.78      0.83      0.80      1314

   micro avg       0.88      0.89      0.88      5587
   macro avg       0.87      0.89      0.88      5587
weighted avg       0.88      0.89      0.88      5587



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.995, train_acc=1, train_loss=0.0533, train_precision=0.996, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.874, eval_acc=0.985, eval_loss=3.5, eval_precision=0.866, eval_recall=0.886] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.88      0.90      0.89      2857
          NT       0.81      0.81      0.81      1314

   micro avg       0.88      0.89      0.89      5587
   macro avg       0.88      0.89      0.88      5587
weighted avg       0.88      0.89      0.89      5587



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.18it/s, F1=0.999, train_acc=1, train_loss=0.0234, train_precision=0.999, train_recall=0.999]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.21it/s, F1=0.879, eval_acc=0.985, eval_loss=3.52, eval_precision=0.877, eval_recall=0.883]


eval_reports:


calculate data/few_shot/msra/train_1350.json etag:   0%|          | 0.00/808k [00:00<?, ?B/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.89      0.90      0.90      2857
          NT       0.80      0.80      0.80      1314

   micro avg       0.89      0.89      0.89      5587
   macro avg       0.88      0.89      0.88      5587
weighted avg       0.89      0.89      0.89      5587

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_1350.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_t

calculate data/few_shot/msra/train_1350.json etag: 100%|██████████| 808k/808k [00:00<00:00, 308MB/s]
calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 340MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 370MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 119kB/s]


load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree


count line size data/few_shot/msra/labels.txt: 14L [00:00, 132551.37L/s]
build line mapper: 14L [00:00, 120082.32L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4765.87it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 149386.17it/s]
load dataset from data/few_shot/msra/train_1350.json: 0it [00:00, ?it/s]

load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_1350.json: 1350it [00:02, 587.79it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 674.51it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model 

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.45it/s, F1=0.104, train_acc=0.812, train_loss=35.9, train_precision=0.092, train_recall=0.125]        


train_reports:
              precision    recall  f1-score   support

          NR       0.05      0.15      0.08       520
          NS       0.10      0.16      0.12      1140
          NT       0.01      0.07      0.02       593

   micro avg       0.04      0.14      0.06      2253
   macro avg       0.05      0.13      0.07      2253
weighted avg       0.06      0.14      0.08      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.629, eval_acc=0.967, eval_loss=4.85, eval_precision=0.561, eval_recall=0.724]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.87      0.91      0.89      1416
          NS       0.69      0.77      0.73      2857
          NT       0.18      0.36      0.24      1314

   micro avg       0.54      0.71      0.62      5587
   macro avg       0.58      0.68      0.62      5587
weighted avg       0.62      0.71      0.66      5587



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.776, train_acc=0.982, train_loss=3.64, train_precision=0.745, train_recall=0.819]


train_reports:
              precision    recall  f1-score   support

          NR       0.93      0.93      0.93       520
          NS       0.83      0.87      0.85      1140
          NT       0.51      0.69      0.59       593

   micro avg       0.75      0.84      0.79      2253
   macro avg       0.76      0.83      0.79      2253
weighted avg       0.77      0.84      0.80      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.24it/s, F1=0.799, eval_acc=0.981, eval_loss=3.3, eval_precision=0.8, eval_recall=0.802]   


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.90      0.91      1416
          NS       0.82      0.85      0.83      2857
          NT       0.62      0.61      0.61      1314

   micro avg       0.80      0.80      0.80      5587
   macro avg       0.79      0.78      0.79      5587
weighted avg       0.80      0.80      0.80      5587



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.903, train_acc=0.992, train_loss=1.45, train_precision=0.889, train_recall=0.921]


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.96      0.96       520
          NS       0.91      0.94      0.93      1140
          NT       0.79      0.87      0.82       593

   micro avg       0.89      0.93      0.91      2253
   macro avg       0.89      0.92      0.90      2253
weighted avg       0.89      0.93      0.91      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.846, eval_acc=0.984, eval_loss=3.1, eval_precision=0.82, eval_recall=0.879]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.84      0.89      0.87      2857
          NT       0.68      0.78      0.73      1314

   micro avg       0.82      0.88      0.85      5587
   macro avg       0.82      0.87      0.84      5587
weighted avg       0.83      0.88      0.85      5587



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.935, train_acc=0.995, train_loss=1, train_precision=0.925, train_recall=0.95]     


train_reports:
              precision    recall  f1-score   support

          NR       0.96      0.97      0.96       520
          NS       0.94      0.96      0.95      1140
          NT       0.86      0.92      0.89       593

   micro avg       0.92      0.95      0.94      2253
   macro avg       0.92      0.95      0.93      2253
weighted avg       0.92      0.95      0.94      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.841, eval_acc=0.984, eval_loss=3.41, eval_precision=0.84, eval_recall=0.845] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.92      0.93      1416
          NS       0.82      0.89      0.85      2857
          NT       0.75      0.70      0.73      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.84      0.84      0.84      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.45it/s, F1=0.929, train_acc=0.994, train_loss=1.08, train_precision=0.914, train_recall=0.949]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       520
          NS       0.91      0.96      0.93      1140
          NT       0.82      0.90      0.86       593

   micro avg       0.90      0.95      0.92      2253
   macro avg       0.90      0.95      0.92      2253
weighted avg       0.90      0.95      0.92      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.854, eval_acc=0.985, eval_loss=3.6, eval_precision=0.849, eval_recall=0.862] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.86      0.87      0.86      2857
          NT       0.75      0.75      0.75      1314

   micro avg       0.85      0.86      0.86      5587
   macro avg       0.85      0.86      0.85      5587
weighted avg       0.85      0.86      0.86      5587



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.96, train_acc=0.997, train_loss=0.589, train_precision=0.954, train_recall=0.968] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       520
          NS       0.98      0.98      0.98      1140
          NT       0.89      0.94      0.92       593

   micro avg       0.95      0.97      0.96      2253
   macro avg       0.95      0.97      0.96      2253
weighted avg       0.95      0.97      0.96      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.824, eval_acc=0.981, eval_loss=3.25, eval_precision=0.797, eval_recall=0.857]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.81      0.87      0.84      2857
          NT       0.65      0.78      0.71      1314

   micro avg       0.80      0.87      0.83      5587
   macro avg       0.80      0.86      0.83      5587
weighted avg       0.81      0.87      0.84      5587



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.981, train_acc=0.998, train_loss=0.319, train_precision=0.978, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.98      0.99      0.99      1140
          NT       0.95      0.97      0.96       593

   micro avg       0.98      0.98      0.98      2253
   macro avg       0.98      0.98      0.98      2253
weighted avg       0.98      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.851, eval_acc=0.984, eval_loss=3.7, eval_precision=0.834, eval_recall=0.872] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.95      0.95      1416
          NS       0.87      0.89      0.88      2857
          NT       0.70      0.81      0.75      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.85      0.88      0.87      5587



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.985, train_acc=0.999, train_loss=0.141, train_precision=0.985, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.862, eval_acc=0.985, eval_loss=3.94, eval_precision=0.85, eval_recall=0.878] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.82      0.89      0.86      2857
          NT       0.79      0.77      0.78      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.84      0.88      0.86      5587



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.984, train_acc=0.999, train_loss=0.199, train_precision=0.981, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.98      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.846, eval_acc=0.984, eval_loss=4.18, eval_precision=0.847, eval_recall=0.848]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.92      0.93      1416
          NS       0.83      0.87      0.85      2857
          NT       0.78      0.75      0.77      1314

   micro avg       0.85      0.86      0.85      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.85      0.86      0.85      5587



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.991, train_acc=0.999, train_loss=0.177, train_precision=0.988, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.849, eval_acc=0.984, eval_loss=3.9, eval_precision=0.83, eval_recall=0.872]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.83      0.88      0.85      2857
          NT       0.72      0.81      0.76      1314

   micro avg       0.83      0.88      0.85      5587
   macro avg       0.83      0.88      0.85      5587
weighted avg       0.83      0.88      0.86      5587



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.978, train_acc=0.998, train_loss=0.416, train_precision=0.975, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.94      0.96      0.95       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.85, eval_acc=0.985, eval_loss=3.44, eval_precision=0.833, eval_recall=0.872] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.85      0.90      0.87      2857
          NT       0.72      0.79      0.75      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.84      0.88      0.86      5587



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.976, train_acc=0.998, train_loss=0.446, train_precision=0.972, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.98      0.99      0.98      1140
          NT       0.94      0.96      0.95       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.841, eval_acc=0.982, eval_loss=4.44, eval_precision=0.84, eval_recall=0.846] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.82      0.86      0.84      2857
          NT       0.72      0.69      0.70      1314

   micro avg       0.83      0.84      0.83      5587
   macro avg       0.82      0.83      0.83      5587
weighted avg       0.82      0.84      0.83      5587



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.986, train_acc=0.999, train_loss=0.304, train_precision=0.984, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.96      0.97      0.97       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.98      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.858, eval_acc=0.984, eval_loss=3.67, eval_precision=0.848, eval_recall=0.871]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.85      0.90      0.87      2857
          NT       0.76      0.75      0.75      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.86      0.85      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:51<00:00,  3.30it/s, F1=0.989, train_acc=0.999, train_loss=0.154, train_precision=0.986, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.845, eval_acc=0.981, eval_loss=4.44, eval_precision=0.822, eval_recall=0.875]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.94      0.93      1416
          NS       0.83      0.88      0.85      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.83      0.87      0.85      5587
weighted avg       0.83      0.87      0.85      5587



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.987, train_acc=0.999, train_loss=0.152, train_precision=0.985, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      1.00      0.99      1140
          NT       0.98      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.858, eval_acc=0.983, eval_loss=4.48, eval_precision=0.855, eval_recall=0.863]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.83      0.88      0.85      2857
          NT       0.79      0.76      0.78      1314

   micro avg       0.85      0.86      0.86      5587
   macro avg       0.85      0.86      0.86      5587
weighted avg       0.85      0.86      0.86      5587



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.993, train_acc=0.999, train_loss=0.149, train_precision=0.991, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.98      0.99      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.36it/s, F1=0.856, eval_acc=0.983, eval_loss=4.47, eval_precision=0.858, eval_recall=0.857]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.92      0.93      1416
          NS       0.84      0.86      0.85      2857
          NT       0.78      0.75      0.76      1314

   micro avg       0.85      0.85      0.85      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.85      0.85      0.85      5587



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.994, train_acc=1, train_loss=0.0902, train_precision=0.994, train_recall=0.995]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.60it/s, F1=0.861, eval_acc=0.984, eval_loss=4.17, eval_precision=0.844, eval_recall=0.884]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.93      0.93      1416
          NS       0.86      0.90      0.88      2857
          NT       0.76      0.81      0.78      1314

   micro avg       0.85      0.89      0.87      5587
   macro avg       0.85      0.88      0.87      5587
weighted avg       0.85      0.89      0.87      5587



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.976, train_acc=0.998, train_loss=0.529, train_precision=0.971, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

          NR       0.97      0.97      0.97       520
          NS       0.97      0.99      0.98      1140
          NT       0.97      0.98      0.97       593

   micro avg       0.97      0.98      0.97      2253
   macro avg       0.97      0.98      0.97      2253
weighted avg       0.97      0.98      0.97      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.78, eval_acc=0.975, eval_loss=4.35, eval_precision=0.731, eval_recall=0.846] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.85      0.88      0.87      1416
          NS       0.83      0.85      0.84      2857
          NT       0.57      0.83      0.68      1314

   micro avg       0.76      0.85      0.80      5587
   macro avg       0.75      0.86      0.80      5587
weighted avg       0.77      0.85      0.81      5587



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.982, train_acc=0.999, train_loss=0.305, train_precision=0.977, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98       520
          NS       0.99      0.99      0.99      1140
          NT       0.95      0.98      0.97       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.97      0.99      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.86, eval_acc=0.985, eval_loss=3.83, eval_precision=0.858, eval_recall=0.864] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.86      0.88      0.87      2857
          NT       0.79      0.76      0.78      1314

   micro avg       0.86      0.87      0.87      5587
   macro avg       0.86      0.87      0.86      5587
weighted avg       0.86      0.87      0.87      5587



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.991, train_acc=0.999, train_loss=0.185, train_precision=0.991, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.98      0.98       520
          NS       1.00      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.849, eval_acc=0.984, eval_loss=3.87, eval_precision=0.843, eval_recall=0.859]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.89      0.91      1416
          NS       0.86      0.89      0.88      2857
          NT       0.73      0.80      0.76      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.86      0.85      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.993, train_acc=0.999, train_loss=0.187, train_precision=0.993, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.855, eval_acc=0.984, eval_loss=3.67, eval_precision=0.836, eval_recall=0.879]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.93      0.94      1416
          NS       0.84      0.89      0.86      2857
          NT       0.75      0.83      0.79      1314

   micro avg       0.84      0.89      0.86      5587
   macro avg       0.85      0.88      0.86      5587
weighted avg       0.85      0.89      0.87      5587



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.24it/s, F1=0.999, train_acc=1, train_loss=0.0291, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.873, eval_acc=0.985, eval_loss=4.22, eval_precision=0.868, eval_recall=0.882]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.92      0.94      1416
          NS       0.88      0.90      0.89      2857
          NT       0.77      0.82      0.79      1314

   micro avg       0.87      0.89      0.88      5587
   macro avg       0.87      0.88      0.87      5587
weighted avg       0.87      0.89      0.88      5587



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.995, train_acc=1, train_loss=0.0552, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.859, eval_acc=0.984, eval_loss=4.56, eval_precision=0.85, eval_recall=0.871] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.93      1416
          NS       0.85      0.88      0.86      2857
          NT       0.76      0.81      0.78      1314

   micro avg       0.85      0.88      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.977, train_acc=0.998, train_loss=0.55, train_precision=0.973, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       520
          NS       0.98      0.99      0.99      1140
          NT       0.95      0.97      0.96       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.17it/s, F1=0.852, eval_acc=0.984, eval_loss=3.75, eval_precision=0.833, eval_recall=0.876]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.92      0.93      1416
          NS       0.84      0.89      0.87      2857
          NT       0.75      0.81      0.78      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.84      0.88      0.86      5587



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.991, train_acc=0.999, train_loss=0.133, train_precision=0.988, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.97      0.99      0.98       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.67it/s, F1=0.859, eval_acc=0.984, eval_loss=4.14, eval_precision=0.853, eval_recall=0.867]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.91      0.93      1416
          NS       0.84      0.89      0.86      2857
          NT       0.78      0.78      0.78      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.86      0.86      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.48it/s, F1=0.998, train_acc=1, train_loss=0.0906, train_precision=0.997, train_recall=0.998]  


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.16it/s, F1=0.843, eval_acc=0.983, eval_loss=4.33, eval_precision=0.829, eval_recall=0.862]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.91      0.92      1416
          NS       0.82      0.88      0.85      2857
          NT       0.78      0.79      0.78      1314

   micro avg       0.84      0.87      0.85      5587
   macro avg       0.84      0.86      0.85      5587
weighted avg       0.84      0.87      0.85      5587



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.998, train_acc=1, train_loss=0.0503, train_precision=0.999, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.65it/s, F1=0.844, eval_acc=0.982, eval_loss=4.81, eval_precision=0.833, eval_recall=0.858]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.83      0.85      0.84      2857
          NT       0.75      0.82      0.78      1314

   micro avg       0.83      0.87      0.85      5587
   macro avg       0.84      0.87      0.85      5587
weighted avg       0.84      0.87      0.85      5587



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.41it/s, F1=0.98, train_acc=0.998, train_loss=0.361, train_precision=0.978, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       0.98      0.98      0.98      1140
          NT       0.95      0.97      0.96       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.83, eval_acc=0.982, eval_loss=4.26, eval_precision=0.826, eval_recall=0.838] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.90      0.90      1416
          NS       0.84      0.85      0.85      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.25it/s, F1=0.99, train_acc=0.999, train_loss=0.092, train_precision=0.989, train_recall=0.992]  


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.27it/s, F1=0.845, eval_acc=0.982, eval_loss=4.51, eval_precision=0.836, eval_recall=0.856]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.93      0.93      1416
          NS       0.86      0.86      0.86      2857
          NT       0.73      0.81      0.77      1314

   micro avg       0.84      0.87      0.85      5587
   macro avg       0.84      0.87      0.85      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.38it/s, F1=0.995, train_acc=1, train_loss=0.0952, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.29it/s, F1=0.835, eval_acc=0.981, eval_loss=4.4, eval_precision=0.829, eval_recall=0.846] 


eval_reports:


calculate data/few_shot/msra/train_1350.json etag: 100%|██████████| 808k/808k [00:00<00:00, 296MB/s]
calculate data/few_shot/msra/dev.json etag:   0%|          | 0.00/2.12M [00:00<?, ?B/s]

              precision    recall  f1-score   support

          NR       0.94      0.93      0.94      1416
          NS       0.87      0.84      0.85      2857
          NT       0.70      0.82      0.76      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.84      0.87      0.85      5587
weighted avg       0.85      0.86      0.85      5587

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/msra/train_1350.json",
    "eval_file": "data/few_shot/msra/dev.json",
    "test_file": "data/few_shot/msra/test.json",
    "tag_file": "data/few_shot/msra/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_t

calculate data/few_shot/msra/dev.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 339MB/s]
calculate data/few_shot/msra/test.json etag: 100%|██████████| 2.12M/2.12M [00:00<00:00, 349MB/s]
calculate data/few_shot/msra/labels.txt etag: 100%|██████████| 62.0/62.0 [00:00<00:00, 119kB/s]


load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/lexicon_tree


count line size data/few_shot/msra/labels.txt: 14L [00:00, 112061.56L/s]
build line mapper: 14L [00:00, 119108.02L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 14/14 [00:00<00:00, 4206.32it/s]
load vocab from list: 100%|██████████| 13/13 [00:00<00:00, 163741.60it/s]
load dataset from data/few_shot/msra/train_1350.json: 0it [00:00, ?it/s]

load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/matched_words
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/word_vocab
load cached ./temp/0a0e7393bc7beec17cf50eebefb4418b_99dcd8ca7c1c46d2956db3748f842917_99dcd8ca7c1c46d2956db3748f842917_b9c74da512a2f72965246b3f0dc0bdf4/1000000/vocab_embedding


load dataset from data/few_shot/msra/train_1350.json: 1350it [00:02, 585.50it/s]
load dataset from data/few_shot/msra/dev.json: 4365it [00:06, 678.29it/s]
Some weights of the model checkpoint at save_pretrained/msra_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model 

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.20it/s, F1=0.127, train_acc=0.771, train_loss=41.1, train_precision=0.121, train_recall=0.143]        


train_reports:
              precision    recall  f1-score   support

          NR       0.10      0.20      0.13       520
          NS       0.04      0.13      0.06      1140
          NT       0.01      0.08      0.02       593

   micro avg       0.03      0.13      0.05      2253
   macro avg       0.05      0.14      0.07      2253
weighted avg       0.04      0.13      0.06      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.30it/s, F1=0.581, eval_acc=0.956, eval_loss=5.72, eval_precision=0.521, eval_recall=0.669]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.69      0.87      0.77      1416
          NS       0.48      0.55      0.52      2857
          NT       0.45      0.73      0.56      1314

   micro avg       0.53      0.67      0.59      5587
   macro avg       0.54      0.72      0.61      5587
weighted avg       0.53      0.67      0.59      5587



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.731, train_acc=0.977, train_loss=3.77, train_precision=0.709, train_recall=0.765]


train_reports:
              precision    recall  f1-score   support

          NR       0.86      0.90      0.88       520
          NS       0.69      0.74      0.71      1140
          NT       0.60      0.73      0.66       593

   micro avg       0.70      0.77      0.73      2253
   macro avg       0.72      0.79      0.75      2253
weighted avg       0.71      0.77      0.74      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.827, eval_acc=0.982, eval_loss=2.34, eval_precision=0.816, eval_recall=0.844]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.91      0.95      0.93      1416
          NS       0.85      0.84      0.85      2857
          NT       0.70      0.77      0.74      1314

   micro avg       0.83      0.85      0.84      5587
   macro avg       0.82      0.85      0.84      5587
weighted avg       0.83      0.85      0.84      5587



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.19it/s, F1=0.886, train_acc=0.991, train_loss=1.42, train_precision=0.876, train_recall=0.899]


train_reports:
              precision    recall  f1-score   support

          NR       0.94      0.94      0.94       520
          NS       0.89      0.92      0.91      1140
          NT       0.79      0.86      0.82       593

   micro avg       0.88      0.91      0.89      2253
   macro avg       0.88      0.91      0.89      2253
weighted avg       0.88      0.91      0.89      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.21it/s, F1=0.842, eval_acc=0.982, eval_loss=2.34, eval_precision=0.838, eval_recall=0.849]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.96      0.95      1416
          NS       0.83      0.85      0.84      2857
          NT       0.75      0.73      0.74      1314

   micro avg       0.84      0.85      0.85      5587
   macro avg       0.84      0.85      0.84      5587
weighted avg       0.84      0.85      0.85      5587



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.948, train_acc=0.996, train_loss=0.689, train_precision=0.944, train_recall=0.953]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.97      0.98       520
          NS       0.95      0.96      0.96      1140
          NT       0.89      0.93      0.91       593

   micro avg       0.94      0.96      0.95      2253
   macro avg       0.94      0.95      0.95      2253
weighted avg       0.94      0.96      0.95      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.849, eval_acc=0.984, eval_loss=2.38, eval_precision=0.825, eval_recall=0.879]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.83      0.90      0.87      2857
          NT       0.74      0.80      0.77      1314

   micro avg       0.83      0.89      0.86      5587
   macro avg       0.83      0.88      0.86      5587
weighted avg       0.84      0.89      0.86      5587



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.966, train_acc=0.998, train_loss=0.431, train_precision=0.962, train_recall=0.972]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.98       520
          NS       0.98      0.98      0.98      1140
          NT       0.92      0.95      0.94       593

   micro avg       0.96      0.97      0.97      2253
   macro avg       0.96      0.97      0.97      2253
weighted avg       0.96      0.97      0.97      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.875, eval_acc=0.986, eval_loss=2.17, eval_precision=0.87, eval_recall=0.882] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.94      0.95      1416
          NS       0.89      0.90      0.89      2857
          NT       0.77      0.80      0.79      1314

   micro avg       0.88      0.89      0.88      5587
   macro avg       0.87      0.88      0.88      5587
weighted avg       0.88      0.89      0.88      5587



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.975, train_acc=0.998, train_loss=0.443, train_precision=0.972, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.97      0.98      0.98      1140
          NT       0.95      0.97      0.96       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.54it/s, F1=0.846, eval_acc=0.982, eval_loss=3.02, eval_precision=0.837, eval_recall=0.859]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.85      0.88      0.86      2857
          NT       0.71      0.72      0.71      1314

   micro avg       0.84      0.86      0.85      5587
   macro avg       0.83      0.85      0.84      5587
weighted avg       0.84      0.86      0.85      5587



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.45it/s, F1=0.975, train_acc=0.998, train_loss=0.425, train_precision=0.971, train_recall=0.98] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.98      0.99      0.99      1140
          NT       0.93      0.96      0.95       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.98      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.26it/s, F1=0.849, eval_acc=0.982, eval_loss=2.83, eval_precision=0.826, eval_recall=0.878]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.96      0.94      1416
          NS       0.87      0.87      0.87      2857
          NT       0.70      0.84      0.77      1314

   micro avg       0.84      0.89      0.86      5587
   macro avg       0.83      0.89      0.86      5587
weighted avg       0.84      0.89      0.86      5587



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.98, train_acc=0.998, train_loss=0.362, train_precision=0.978, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.95      0.97      0.96       593

   micro avg       0.98      0.98      0.98      2253
   macro avg       0.98      0.98      0.98      2253
weighted avg       0.98      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.46it/s, F1=0.846, eval_acc=0.982, eval_loss=3.11, eval_precision=0.847, eval_recall=0.849]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.93      0.94      1416
          NS       0.86      0.85      0.86      2857
          NT       0.75      0.78      0.77      1314

   micro avg       0.86      0.85      0.86      5587
   macro avg       0.85      0.85      0.85      5587
weighted avg       0.86      0.85      0.86      5587



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.985, train_acc=0.999, train_loss=0.342, train_precision=0.984, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.98      0.99      0.99      2253
   macro avg       0.98      0.99      0.99      2253
weighted avg       0.98      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.32it/s, F1=0.851, eval_acc=0.984, eval_loss=3.27, eval_precision=0.863, eval_recall=0.842]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.96      0.92      0.94      1416
          NS       0.88      0.86      0.87      2857
          NT       0.79      0.78      0.79      1314

   micro avg       0.88      0.86      0.87      5587
   macro avg       0.88      0.85      0.87      5587
weighted avg       0.88      0.86      0.87      5587



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.974, train_acc=0.998, train_loss=0.361, train_precision=0.97, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

          NR       0.95      0.97      0.96       520
          NS       0.98      0.99      0.98      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.97      0.98      0.98      2253
   macro avg       0.97      0.98      0.97      2253
weighted avg       0.97      0.98      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:19<00:00,  3.56it/s, F1=0.864, eval_acc=0.985, eval_loss=2.86, eval_precision=0.869, eval_recall=0.862]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.89      0.87      0.88      2857
          NT       0.82      0.79      0.80      1314

   micro avg       0.88      0.87      0.88      5587
   macro avg       0.88      0.87      0.88      5587
weighted avg       0.88      0.87      0.88      5587



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.49it/s, F1=0.992, train_acc=0.999, train_loss=0.128, train_precision=0.991, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.35it/s, F1=0.869, eval_acc=0.984, eval_loss=3.22, eval_precision=0.869, eval_recall=0.87] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.93      1416
          NS       0.88      0.88      0.88      2857
          NT       0.81      0.79      0.80      1314

   micro avg       0.88      0.88      0.88      5587
   macro avg       0.87      0.87      0.87      5587
weighted avg       0.88      0.88      0.88      5587



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.991, train_acc=0.999, train_loss=0.192, train_precision=0.989, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.97      0.98      0.97       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.856, eval_acc=0.984, eval_loss=3.44, eval_precision=0.849, eval_recall=0.866]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.85      0.90      0.88      2857
          NT       0.77      0.74      0.76      1314

   micro avg       0.86      0.88      0.87      5587
   macro avg       0.86      0.86      0.86      5587
weighted avg       0.86      0.88      0.87      5587



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.993, train_acc=0.999, train_loss=0.136, train_precision=0.992, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.85, eval_acc=0.984, eval_loss=2.78, eval_precision=0.834, eval_recall=0.871] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.85      0.89      0.87      2857
          NT       0.73      0.79      0.76      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:53<00:00,  3.19it/s, F1=0.982, train_acc=0.999, train_loss=0.252, train_precision=0.979, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       520
          NS       0.98      0.99      0.98      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.98      0.99      0.98      2253
   macro avg       0.98      0.99      0.98      2253
weighted avg       0.98      0.99      0.98      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.22it/s, F1=0.833, eval_acc=0.98, eval_loss=4, eval_precision=0.848, eval_recall=0.822]    


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.82      0.81      0.82      2857
          NT       0.78      0.72      0.75      1314

   micro avg       0.84      0.82      0.83      5587
   macro avg       0.84      0.83      0.83      5587
weighted avg       0.84      0.82      0.83      5587



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.98, train_acc=0.999, train_loss=0.196, train_precision=0.976, train_recall=0.986] 


train_reports:
              precision    recall  f1-score   support

          NR       0.98      0.99      0.99       520
          NS       0.99      1.00      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.33it/s, F1=0.855, eval_acc=0.983, eval_loss=3.4, eval_precision=0.846, eval_recall=0.867] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.85      0.87      0.86      2857
          NT       0.75      0.81      0.78      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.994, train_acc=0.999, train_loss=0.111, train_precision=0.993, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.98      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.853, eval_acc=0.982, eval_loss=3.8, eval_precision=0.869, eval_recall=0.841] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.86      0.83      0.84      2857
          NT       0.80      0.76      0.78      1314

   micro avg       0.87      0.84      0.86      5587
   macro avg       0.87      0.84      0.86      5587
weighted avg       0.87      0.84      0.86      5587



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.48it/s, F1=0.995, train_acc=1, train_loss=0.0814, train_precision=0.993, train_recall=0.996]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      1.00      0.99       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      1.00      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.866, eval_acc=0.985, eval_loss=2.99, eval_precision=0.852, eval_recall=0.884]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.95      0.94      1416
          NS       0.87      0.89      0.88      2857
          NT       0.78      0.82      0.80      1314

   micro avg       0.86      0.89      0.88      5587
   macro avg       0.86      0.89      0.87      5587
weighted avg       0.86      0.89      0.88      5587



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.22it/s, F1=0.998, train_acc=1, train_loss=0.0366, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.21it/s, F1=0.866, eval_acc=0.985, eval_loss=3.2, eval_precision=0.864, eval_recall=0.87]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.92      0.94      1416
          NS       0.89      0.89      0.89      2857
          NT       0.79      0.82      0.80      1314

   micro avg       0.88      0.88      0.88      5587
   macro avg       0.87      0.88      0.88      5587
weighted avg       0.88      0.88      0.88      5587



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.43it/s, F1=0.995, train_acc=1, train_loss=0.0912, train_precision=0.995, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.832, eval_acc=0.983, eval_loss=3.45, eval_precision=0.801, eval_recall=0.871]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.92      0.95      0.94      1416
          NS       0.78      0.86      0.82      2857
          NT       0.71      0.82      0.76      1314

   micro avg       0.80      0.87      0.83      5587
   macro avg       0.80      0.88      0.84      5587
weighted avg       0.80      0.87      0.84      5587



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.25it/s, F1=0.988, train_acc=1, train_loss=0.108, train_precision=0.987, train_recall=0.988]    


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      0.99      0.99      1140
          NT       1.00      0.99      1.00       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.875, eval_acc=0.986, eval_loss=3.41, eval_precision=0.882, eval_recall=0.872]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.87      0.90      0.89      2857
          NT       0.82      0.78      0.80      1314

   micro avg       0.88      0.88      0.88      5587
   macro avg       0.88      0.87      0.88      5587
weighted avg       0.88      0.88      0.88      5587



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.988, train_acc=0.999, train_loss=0.138, train_precision=0.986, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      1.00      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.69it/s, F1=0.847, eval_acc=0.983, eval_loss=3.56, eval_precision=0.819, eval_recall=0.883]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.94      0.94      1416
          NS       0.88      0.89      0.88      2857
          NT       0.68      0.85      0.76      1314

   micro avg       0.84      0.89      0.86      5587
   macro avg       0.83      0.89      0.86      5587
weighted avg       0.85      0.89      0.87      5587



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.986, train_acc=0.999, train_loss=0.221, train_precision=0.985, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       0.99      0.98      0.99      1140
          NT       0.98      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.864, eval_acc=0.984, eval_loss=3.64, eval_precision=0.863, eval_recall=0.868]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.90      0.95      0.93      1416
          NS       0.89      0.88      0.88      2857
          NT       0.79      0.78      0.79      1314

   micro avg       0.87      0.87      0.87      5587
   macro avg       0.86      0.87      0.86      5587
weighted avg       0.87      0.87      0.87      5587



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.994, train_acc=0.999, train_loss=0.109, train_precision=0.995, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.67it/s, F1=0.853, eval_acc=0.982, eval_loss=4.09, eval_precision=0.846, eval_recall=0.864]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.95      0.94      1416
          NS       0.84      0.87      0.85      2857
          NT       0.76      0.78      0.77      1314

   micro avg       0.85      0.87      0.86      5587
   macro avg       0.85      0.87      0.86      5587
weighted avg       0.85      0.87      0.86      5587



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.44it/s, F1=0.985, train_acc=0.999, train_loss=0.258, train_precision=0.984, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

          NR       0.99      0.99      0.99       520
          NS       1.00      1.00      1.00      1140
          NT       0.96      0.97      0.97       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.98      0.99      0.98      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.31it/s, F1=0.858, eval_acc=0.983, eval_loss=3.33, eval_precision=0.841, eval_recall=0.88] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.93      0.90      0.92      1416
          NS       0.86      0.92      0.89      2857
          NT       0.79      0.78      0.78      1314

   micro avg       0.86      0.88      0.87      5587
   macro avg       0.86      0.87      0.86      5587
weighted avg       0.86      0.88      0.87      5587



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.994, train_acc=1, train_loss=0.0936, train_precision=0.993, train_recall=0.995]   


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      0.99       520
          NS       0.99      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:18<00:00,  3.70it/s, F1=0.87, eval_acc=0.985, eval_loss=3.46, eval_precision=0.873, eval_recall=0.87]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.88      0.89      0.88      2857
          NT       0.81      0.78      0.79      1314

   micro avg       0.88      0.88      0.88      5587
   macro avg       0.88      0.87      0.87      5587
weighted avg       0.88      0.88      0.88      5587



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.42it/s, F1=0.996, train_acc=0.999, train_loss=0.1, train_precision=0.996, train_recall=0.997]   


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       1.00      1.00      1.00      1140
          NT       0.98      0.99      0.99       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       0.99      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.38it/s, F1=0.849, eval_acc=0.984, eval_loss=3.26, eval_precision=0.826, eval_recall=0.876]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.94      1416
          NS       0.81      0.88      0.85      2857
          NT       0.74      0.82      0.78      1314

   micro avg       0.83      0.88      0.85      5587
   macro avg       0.84      0.88      0.86      5587
weighted avg       0.83      0.88      0.86      5587



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:52<00:00,  3.21it/s, F1=0.991, train_acc=0.999, train_loss=0.107, train_precision=0.99, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.863, eval_acc=0.984, eval_loss=3.64, eval_precision=0.863, eval_recall=0.864]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.86      0.88      0.87      2857
          NT       0.80      0.77      0.78      1314

   micro avg       0.87      0.87      0.87      5587
   macro avg       0.87      0.86      0.87      5587
weighted avg       0.87      0.87      0.87      5587



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.45it/s, F1=0.994, train_acc=1, train_loss=0.0919, train_precision=0.993, train_recall=0.996]   


train_reports:
              precision    recall  f1-score   support

          NR       0.99      1.00      1.00       520
          NS       0.99      1.00      1.00      1140
          NT       0.99      0.99      0.99       593

   micro avg       0.99      1.00      0.99      2253
   macro avg       0.99      1.00      0.99      2253
weighted avg       0.99      1.00      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.855, eval_acc=0.984, eval_loss=3.62, eval_precision=0.838, eval_recall=0.875]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.94      0.94      0.94      1416
          NS       0.84      0.89      0.86      2857
          NT       0.76      0.81      0.78      1314

   micro avg       0.84      0.88      0.86      5587
   macro avg       0.85      0.88      0.86      5587
weighted avg       0.85      0.88      0.86      5587



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:51<00:00,  3.29it/s, F1=0.996, train_acc=1, train_loss=0.0751, train_precision=0.996, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      1.00      1.00       520
          NS       0.99      1.00      1.00      1140
          NT       1.00      1.00      1.00       593

   micro avg       1.00      1.00      1.00      2253
   macro avg       1.00      1.00      1.00      2253
weighted avg       1.00      1.00      1.00      2253



Eval Result: 100%|██████████| 69/69 [00:15<00:00,  4.34it/s, F1=0.869, eval_acc=0.985, eval_loss=3.09, eval_precision=0.869, eval_recall=0.872]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

          NR       0.95      0.94      0.95      1416
          NS       0.88      0.87      0.87      2857
          NT       0.80      0.82      0.81      1314

   micro avg       0.88      0.88      0.88      5587
   macro avg       0.88      0.88      0.88      5587
weighted avg       0.88      0.88      0.88      5587



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:49<00:00,  3.40it/s, F1=0.991, train_acc=0.999, train_loss=0.166, train_precision=0.99, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

          NR       1.00      0.99      1.00       520
          NS       0.99      0.99      0.99      1140
          NT       0.97      0.98      0.98       593

   micro avg       0.99      0.99      0.99      2253
   macro avg       0.99      0.99      0.99      2253
weighted avg       0.99      0.99      0.99      2253



Eval Result: 100%|██████████| 69/69 [00:16<00:00,  4.25it/s, F1=0.842, eval_acc=0.981, eval_loss=3.24, eval_precision=0.818, eval_recall=0.871]


eval_reports:


calculate data/few_shot/resume/train_250.json etag: 100%|██████████| 108k/108k [00:00<00:00, 163MB/s]
calculate data/few_shot/resume/dev.json etag:   0%|          | 0.00/208k [00:00<?, ?B/s]

              precision    recall  f1-score   support

          NR       0.92      0.95      0.93      1416
          NS       0.87      0.86      0.86      2857
          NT       0.67      0.83      0.74      1314

   micro avg       0.83      0.88      0.85      5587
   macro avg       0.82      0.88      0.85      5587
weighted avg       0.83      0.88      0.85      5587

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_250.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot/resume/test.json",
    "tag_file": "data/few_shot/resume/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "de

calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 13.4MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 17.9MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 318kB/s]


load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/lexicon_tree


count line size data/few_shot/resume/labels.txt: 29L [00:00, 211171.56L/s]
build line mapper: 29L [00:00, 246224.32L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 7996.50it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 267518.25it/s]
load dataset from data/few_shot/resume/train_250.json: 0it [00:00, ?it/s]

load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_250.json: 250it [00:00, 896.25it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 856.62it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.79it/s, F1=0.00231, train_acc=0.129, train_loss=101, train_precision=0.00215, train_recall=0.00333]  


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.00      0.01      0.00       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.00      0.00      0.00       353

   micro avg       0.00      0.00      0.00       786
   macro avg       0.00      0.00      0.00       786
weighted avg       0.00      0.00      0.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.0173, eval_acc=0.557, eval_loss=65.4, eval_precision=0.0417, eval_recall=0.011]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.06      0.03      0.04       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.00      0.00      0.00       690

   micro avg       0.05      0.01      0.02      1497
   macro avg       0.01      0.00      0.01      1497
weighted avg       0.02      0.01      0.02      1497



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.80it/s, F1=0.0616, train_acc=0.633, train_loss=43.5, train_precision=0.0643, train_recall=0.068]  


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.19      0.19      0.19       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.01      0.02      0.02       353

   micro avg       0.08      0.07      0.08       786
   macro avg       0.03      0.03      0.03       786
weighted avg       0.07      0.07      0.07       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.238, eval_acc=0.717, eval_loss=29.9, eval_precision=0.197, eval_recall=0.301]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.39      0.57      0.46       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.09      0.20      0.12       690

   micro avg       0.19      0.29      0.23      1497
   macro avg       0.06      0.10      0.07      1497
weighted avg       0.18      0.29      0.22      1497



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.416, train_acc=0.802, train_loss=20.4, train_precision=0.371, train_recall=0.484] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.29      0.21      0.24        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.45      0.67      0.54       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.35      0.57      0.44       353

   micro avg       0.35      0.49      0.41       786
   macro avg       0.14      0.18      0.15       786
weighted avg       0.33      0.49      0.39       786



Eval Result: 100%|██████████| 8/8 [00:04<00:00,  1.74it/s, F1=0.633, eval_acc=0.87, eval_loss=15.1, eval_precision=0.565, eval_recall=0.722] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.62      0.70      0.66       106
         LOC       0.00      0.00      0.00         2
        NAME       0.03      0.05      0.04       110
         ORG       0.69      0.80      0.74       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.60      0.82      0.69       690

   micro avg       0.55      0.71      0.62      1497
   macro avg       0.24      0.30      0.27      1497
weighted avg       0.56      0.71      0.63      1497



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.97it/s, F1=0.707, train_acc=0.932, train_loss=8.33, train_precision=0.659, train_recall=0.772]


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.52      0.65      0.57        48
         LOC       0.00      0.00      0.00         2
        NAME       0.32      0.49      0.38        80
         ORG       0.79      0.86      0.83       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.72      0.87      0.79       353

   micro avg       0.64      0.77      0.70       786
   macro avg       0.29      0.36      0.32       786
weighted avg       0.65      0.77      0.71       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.764, eval_acc=0.934, eval_loss=7.47, eval_precision=0.716, eval_recall=0.822]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.01      0.03      0.02        33
         EDU       0.57      0.69      0.63       106
         LOC       0.00      0.00      0.00         2
        NAME       0.90      0.88      0.89       110
         ORG       0.77      0.85      0.81       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.72      0.89      0.80       690

   micro avg       0.70      0.82      0.76      1497
   macro avg       0.37      0.42      0.39      1497
weighted avg       0.71      0.82      0.76      1497



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:07<00:00,  4.01it/s, F1=0.837, train_acc=0.962, train_loss=4.72, train_precision=0.808, train_recall=0.874]


train_reports:
              precision    recall  f1-score   support

        CONT       0.45      0.78      0.57        18
         EDU       0.55      0.73      0.62        48
         LOC       0.00      0.00      0.00         2
        NAME       0.94      0.93      0.93        80
         ORG       0.84      0.92      0.88       265
         PRO       0.00      0.00      0.00        11
        RACE       1.00      0.11      0.20         9
       TITLE       0.87      0.94      0.90       353

   micro avg       0.82      0.89      0.85       786
   macro avg       0.58      0.55      0.51       786
weighted avg       0.82      0.89      0.85       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.841, eval_acc=0.944, eval_loss=6.85, eval_precision=0.804, eval_recall=0.884]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.84      0.97      0.90        33
         EDU       0.65      0.79      0.71       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.93      0.95       110
         ORG       0.79      0.88      0.83       523
         PRO       0.00      0.00      0.00        18
        RACE       0.93      0.87      0.90        15
       TITLE       0.82      0.91      0.86       690

   micro avg       0.79      0.88      0.83      1497
   macro avg       0.63      0.67      0.64      1497
weighted avg       0.80      0.88      0.84      1497



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.921, train_acc=0.986, train_loss=2, train_precision=0.901, train_recall=0.945]   


train_reports:
              precision    recall  f1-score   support

        CONT       0.90      1.00      0.95        18
         EDU       0.67      0.85      0.75        48
         LOC       0.00      0.00      0.00         2
        NAME       0.94      0.96      0.95        80
         ORG       0.91      0.95      0.93       265
         PRO       0.00      0.00      0.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.93      0.97      0.95       353

   micro avg       0.89      0.94      0.91       786
   macro avg       0.67      0.72      0.69       786
weighted avg       0.89      0.94      0.91       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.856, eval_acc=0.952, eval_loss=5.88, eval_precision=0.82, eval_recall=0.898] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.80      0.97      0.88        33
         EDU       0.80      0.90      0.84       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.93      0.95       110
         ORG       0.82      0.89      0.85       523
         PRO       0.00      0.00      0.00        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.81      0.90      0.85      1497
   macro avg       0.64      0.69      0.67      1497
weighted avg       0.82      0.90      0.86      1497



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.953, train_acc=0.989, train_loss=1.44, train_precision=0.941, train_recall=0.967]


train_reports:
              precision    recall  f1-score   support

        CONT       0.86      1.00      0.92        18
         EDU       0.87      0.96      0.91        48
         LOC       0.00      0.00      0.00         2
        NAME       0.95      0.95      0.95        80
         ORG       0.94      0.97      0.95       265
         PRO       0.25      0.36      0.30        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.97      0.99      0.98       353

   micro avg       0.93      0.96      0.95       786
   macro avg       0.73      0.78      0.75       786
weighted avg       0.94      0.96      0.95       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.861, eval_acc=0.952, eval_loss=5.69, eval_precision=0.817, eval_recall=0.911]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.85      0.95      0.90       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      0.97      0.98       110
         ORG       0.78      0.89      0.84       523
         PRO       0.26      0.50      0.35        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.78      0.90      0.84       690

   micro avg       0.80      0.91      0.85      1497
   macro avg       0.70      0.77      0.73      1497
weighted avg       0.80      0.91      0.85      1497



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.96it/s, F1=0.963, train_acc=0.994, train_loss=0.88, train_precision=0.955, train_recall=0.971] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       0.88      0.92      0.90        48
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.96      0.97        80
         ORG       0.96      0.97      0.96       265
         PRO       0.62      0.73      0.67        11
        RACE       0.90      1.00      0.95         9
       TITLE       0.98      0.99      0.98       353

   micro avg       0.95      0.97      0.96       786
   macro avg       0.79      0.82      0.80       786
weighted avg       0.96      0.97      0.96       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.879, eval_acc=0.96, eval_loss=4.77, eval_precision=0.839, eval_recall=0.924] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.91      0.96      0.94       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      0.98      0.97       110
         ORG       0.79      0.90      0.84       523
         PRO       0.48      0.72      0.58        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.82      0.92      0.87      1497
   macro avg       0.73      0.81      0.77      1497
weighted avg       0.83      0.92      0.87      1497



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.987, train_acc=0.997, train_loss=0.482, train_precision=0.984, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.97      0.98      0.98       265
         PRO       0.91      0.91      0.91        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       0.98      0.99      0.99       786
   macro avg       0.86      0.86      0.86       786
weighted avg       0.98      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.897, eval_acc=0.96, eval_loss=5.28, eval_precision=0.867, eval_recall=0.931] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.93      0.98      0.95       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      0.99      0.99       110
         ORG       0.82      0.91      0.86       523
         PRO       0.46      0.72      0.57        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.85      0.92      0.88      1497
   macro avg       0.74      0.81      0.77      1497
weighted avg       0.85      0.92      0.89      1497



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.99it/s, F1=0.991, train_acc=0.999, train_loss=0.301, train_precision=0.988, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       0.98      1.00      0.99        48
         LOC       0.50      0.50      0.50         2
        NAME       0.99      1.00      0.99        80
         ORG       0.99      0.99      0.99       265
         PRO       0.91      0.91      0.91        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       0.92      0.92      0.92       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.893, eval_acc=0.96, eval_loss=5.59, eval_precision=0.859, eval_recall=0.931] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.94      0.97      0.95       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      0.99      0.98       110
         ORG       0.81      0.89      0.85       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.94      0.89       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.76      0.84      0.80      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.84it/s, F1=0.993, train_acc=0.999, train_loss=0.221, train_precision=0.991, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       0.50      0.50      0.50         2
        NAME       0.99      1.00      0.99        80
         ORG       0.98      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       0.93      0.94      0.93       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.54it/s, F1=0.899, eval_acc=0.959, eval_loss=6.14, eval_precision=0.87, eval_recall=0.932] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.94      0.98      0.96       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      0.99      0.98       110
         ORG       0.83      0.91      0.87       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.84      0.91      0.88       690

   micro avg       0.85      0.92      0.89      1497
   macro avg       0.77      0.85      0.81      1497
weighted avg       0.85      0.92      0.89      1497



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.95it/s, F1=0.998, train_acc=1, train_loss=0.146, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.905, eval_acc=0.96, eval_loss=6.29, eval_precision=0.877, eval_recall=0.935] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.93      0.97      0.95       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      0.99      0.98       110
         ORG       0.83      0.91      0.87       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.91it/s, F1=0.997, train_acc=0.999, train_loss=0.127, train_precision=0.996, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.91, eval_acc=0.962, eval_loss=6.16, eval_precision=0.881, eval_recall=0.941] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      0.98      0.97       110
         ORG       0.84      0.91      0.88       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.93      0.90      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.998, train_acc=1, train_loss=0.0973, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.42it/s, F1=0.912, eval_acc=0.961, eval_loss=6.53, eval_precision=0.885, eval_recall=0.942]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.50      0.50      0.50         2
        NAME       0.96      0.99      0.98       110
         ORG       0.84      0.91      0.87       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.90       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.84      0.91      0.87      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:10<00:00,  2.92it/s, F1=0.99, train_acc=0.998, train_loss=0.236, train_precision=0.987, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      0.99      0.99       353

   micro avg       0.99      0.99      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.51it/s, F1=0.895, eval_acc=0.956, eval_loss=7.48, eval_precision=0.863, eval_recall=0.931]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.98      0.98       110
         ORG       0.80      0.92      0.86       523
         PRO       0.75      1.00      0.86        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.91      0.88       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:07<00:00,  4.04it/s, F1=0.995, train_acc=0.999, train_loss=0.176, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.98      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.892, eval_acc=0.956, eval_loss=7.14, eval_precision=0.856, eval_recall=0.932]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.97      0.94       106
         LOC       0.50      0.50      0.50         2
        NAME       0.97      0.99      0.98       110
         ORG       0.81      0.90      0.85       523
         PRO       0.64      1.00      0.78        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.83      0.92      0.87       690

   micro avg       0.84      0.93      0.88      1497
   macro avg       0.82      0.91      0.86      1497
weighted avg       0.84      0.93      0.88      1497



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.87it/s, F1=0.997, train_acc=1, train_loss=0.0967, train_precision=0.997, train_recall=0.997]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.9, eval_acc=0.959, eval_loss=6.77, eval_precision=0.868, eval_recall=0.935]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.97      0.95       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.98      0.98       110
         ORG       0.81      0.92      0.86       523
         PRO       0.62      1.00      0.77        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.77      0.85      0.80      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.99, train_acc=0.999, train_loss=0.0978, train_precision=0.989, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.905, eval_acc=0.96, eval_loss=6.86, eval_precision=0.875, eval_recall=0.937] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.50      0.50      0.50         2
        NAME       0.97      0.98      0.98       110
         ORG       0.83      0.91      0.87       523
         PRO       0.64      1.00      0.78        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.85      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.83      0.91      0.86      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=1, train_acc=1, train_loss=0.0681, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.906, eval_acc=0.96, eval_loss=6.88, eval_precision=0.877, eval_recall=0.939] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.50      0.50      0.50         2
        NAME       0.97      0.99      0.98       110
         ORG       0.83      0.91      0.87       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.82      0.91      0.86      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.998, train_acc=1, train_loss=0.0567, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.907, eval_acc=0.96, eval_loss=7.04, eval_precision=0.878, eval_recall=0.939] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.99      0.98       110
         ORG       0.82      0.91      0.87       523
         PRO       0.62      1.00      0.77        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.86      0.93      0.90      1497



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.999, train_acc=1, train_loss=0.0332, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.902, eval_acc=0.96, eval_loss=7.12, eval_precision=0.87, eval_recall=0.938]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       0.50      0.50      0.50         2
        NAME       0.97      0.99      0.98       110
         ORG       0.82      0.91      0.86       523
         PRO       0.62      1.00      0.77        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.83      0.91      0.87      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.91it/s, F1=0.999, train_acc=1, train_loss=0.0308, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.903, eval_acc=0.961, eval_loss=6.96, eval_precision=0.87, eval_recall=0.939] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.91      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.98      0.98       110
         ORG       0.82      0.91      0.86       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.89      0.97      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.98it/s, F1=0.999, train_acc=1, train_loss=0.0316, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.906, eval_acc=0.959, eval_loss=7.71, eval_precision=0.877, eval_recall=0.939]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.50      0.50      0.50         2
        NAME       0.97      0.99      0.98       110
         ORG       0.82      0.91      0.86       523
         PRO       0.60      1.00      0.75        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.83      0.91      0.86      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.98it/s, F1=1, train_acc=1, train_loss=0.0364, train_precision=0.999, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.902, eval_acc=0.96, eval_loss=7.21, eval_precision=0.87, eval_recall=0.937]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.98      0.98       110
         ORG       0.81      0.91      0.86       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.89      0.97      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=1, train_acc=1, train_loss=0.0242, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.42it/s, F1=0.902, eval_acc=0.958, eval_loss=7.95, eval_precision=0.871, eval_recall=0.938]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.98      0.98       110
         ORG       0.82      0.92      0.87       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:11<00:00,  2.81it/s, F1=1, train_acc=1, train_loss=0.0201, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.24it/s, F1=0.9, eval_acc=0.958, eval_loss=7.77, eval_precision=0.869, eval_recall=0.936]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      0.98      0.97       110
         ORG       0.81      0.92      0.86       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.89      0.97      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=1, train_acc=1, train_loss=0.0173, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.57it/s, F1=0.905, eval_acc=0.958, eval_loss=7.97, eval_precision=0.875, eval_recall=0.939]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      0.98      0.97       110
         ORG       0.82      0.91      0.86       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.95it/s, F1=1, train_acc=1, train_loss=0.0149, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.9, eval_acc=0.958, eval_loss=7.99, eval_precision=0.868, eval_recall=0.936]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.99      0.98       110
         ORG       0.81      0.91      0.86       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:07<00:00,  4.00it/s, F1=0.999, train_acc=1, train_loss=0.0439, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.901, eval_acc=0.957, eval_loss=8.29, eval_precision=0.869, eval_recall=0.935]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.99      0.98       110
         ORG       0.82      0.91      0.86       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.999, train_acc=0.999, train_loss=0.171, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.889, eval_acc=0.957, eval_loss=7.07, eval_precision=0.852, eval_recall=0.93] 


eval_reports:


calculate data/few_shot/resume/train_250.json etag: 100%|██████████| 108k/108k [00:00<00:00, 120MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 209MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 222MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 348kB/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.90      0.96      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      0.98      0.98       110
         ORG       0.81      0.90      0.85       523
         PRO       0.55      1.00      0.71        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.84      0.92      0.88      1497
   macro avg       0.87      0.97      0.91      1497
weighted avg       0.85      0.92      0.88      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_250.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot


count line size data/few_shot/resume/labels.txt: 29L [00:00, 232571.35L/s]
build line mapper: 29L [00:00, 244246.62L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8536.97it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 244667.73it/s]
load dataset from data/few_shot/resume/train_250.json: 94it [00:00, 921.95it/s]

load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_250.json: 250it [00:00, 883.54it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 827.25it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.80it/s, F1=0, train_acc=0.209, train_loss=92.8, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.00      0.00      0.00       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.00      0.00      0.00       353

   micro avg       0.00      0.00      0.00       786
   macro avg       0.00      0.00      0.00       786
weighted avg       0.00      0.00      0.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.43it/s, F1=0, eval_acc=0.43, eval_loss=62.2, eval_precision=0, eval_recall=0] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.00      0.00      0.00       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.00      0.00      0.00       690

   micro avg       0.00      0.00      0.00      1497
   macro avg       0.00      0.00      0.00      1497
weighted avg       0.00      0.00      0.00      1497



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.80it/s, F1=0.165, train_acc=0.627, train_loss=40.3, train_precision=0.186, train_recall=0.149]    


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.22      0.25      0.24       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.16      0.14      0.15       353

   micro avg       0.18      0.15      0.16       786
   macro avg       0.05      0.05      0.05       786
weighted avg       0.15      0.15      0.15       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.403, eval_acc=0.722, eval_loss=26.6, eval_precision=0.425, eval_recall=0.384]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.47      0.57      0.51       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.38      0.41      0.40       690

   micro avg       0.42      0.39      0.40      1497
   macro avg       0.11      0.12      0.11      1497
weighted avg       0.34      0.39      0.36      1497



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.508, train_acc=0.837, train_loss=16.8, train_precision=0.488, train_recall=0.541]


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.01      0.02      0.02        48
         LOC       0.00      0.00      0.00         2
        NAME       0.09      0.07      0.08        80
         ORG       0.50      0.65      0.56       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.66      0.74      0.70       353

   micro avg       0.49      0.56      0.52       786
   macro avg       0.16      0.18      0.17       786
weighted avg       0.48      0.56      0.51       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.40it/s, F1=0.697, eval_acc=0.903, eval_loss=12.2, eval_precision=0.636, eval_recall=0.771]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.08      0.20      0.11       106
         LOC       0.00      0.00      0.00         2
        NAME       0.75      0.95      0.84       110
         ORG       0.72      0.82      0.76       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.76      0.87      0.81       690

   micro avg       0.62      0.77      0.69      1497
   macro avg       0.29      0.35      0.32      1497
weighted avg       0.66      0.77      0.71      1497



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.90it/s, F1=0.794, train_acc=0.953, train_loss=6.36, train_precision=0.751, train_recall=0.846]


train_reports:
              precision    recall  f1-score   support

        CONT       0.21      0.22      0.22        18
         EDU       0.12      0.29      0.17        48
         LOC       0.00      0.00      0.00         2
        NAME       0.84      0.97      0.90        80
         ORG       0.82      0.91      0.86       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.90      0.93      0.92       353

   micro avg       0.74      0.85      0.79       786
   macro avg       0.36      0.42      0.38       786
weighted avg       0.78      0.85      0.81       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.823, eval_acc=0.928, eval_loss=8.5, eval_precision=0.78, eval_recall=0.872]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.85      0.85      0.85        33
         EDU       0.37      0.62      0.46       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.77      0.89      0.83       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.83      0.90      0.86       690

   micro avg       0.77      0.87      0.81      1497
   macro avg       0.48      0.53      0.50      1497
weighted avg       0.77      0.87      0.81      1497



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=0.871, train_acc=0.966, train_loss=3.85, train_precision=0.852, train_recall=0.893]


train_reports:
              precision    recall  f1-score   support

        CONT       0.71      0.94      0.81        18
         EDU       0.61      0.79      0.69        48
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.94      0.96        80
         ORG       0.82      0.89      0.86       265
         PRO       0.20      0.18      0.19        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.90      0.93      0.92       353

   micro avg       0.84      0.89      0.86       786
   macro avg       0.53      0.59      0.55       786
weighted avg       0.84      0.89      0.86       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.836, eval_acc=0.941, eval_loss=7.03, eval_precision=0.783, eval_recall=0.898]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.72      1.00      0.84        33
         EDU       0.71      0.91      0.79       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      0.98      0.98       110
         ORG       0.74      0.87      0.80       523
         PRO       0.03      0.06      0.04        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.82      0.93      0.87       690

   micro avg       0.77      0.89      0.82      1497
   macro avg       0.50      0.59      0.54      1497
weighted avg       0.77      0.89      0.83      1497



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.97it/s, F1=0.924, train_acc=0.987, train_loss=1.89, train_precision=0.906, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

        CONT       0.86      1.00      0.92        18
         EDU       0.75      0.90      0.82        48
         LOC       0.00      0.00      0.00         2
        NAME       1.00      0.96      0.98        80
         ORG       0.90      0.95      0.92       265
         PRO       0.06      0.09      0.07        11
        RACE       0.33      0.33      0.33         9
       TITLE       0.96      0.98      0.97       353

   micro avg       0.90      0.94      0.92       786
   macro avg       0.61      0.65      0.63       786
weighted avg       0.91      0.94      0.92       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.38it/s, F1=0.884, eval_acc=0.944, eval_loss=7.48, eval_precision=0.852, eval_recall=0.919]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.80      0.88      0.84       523
         PRO       0.38      0.56      0.45        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.84      0.91      0.87      1497
   macro avg       0.73      0.79      0.76      1497
weighted avg       0.84      0.91      0.88      1497



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.87it/s, F1=0.956, train_acc=0.992, train_loss=1.19, train_precision=0.946, train_recall=0.968] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       0.92      0.96      0.94        48
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99        80
         ORG       0.94      0.97      0.95       265
         PRO       0.54      0.64      0.58        11
        RACE       0.89      0.89      0.89         9
       TITLE       0.97      0.98      0.97       353

   micro avg       0.95      0.97      0.96       786
   macro avg       0.78      0.80      0.79       786
weighted avg       0.95      0.97      0.96       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.896, eval_acc=0.953, eval_loss=5.52, eval_precision=0.865, eval_recall=0.928]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.81      0.91      0.86       523
         PRO       0.41      0.72      0.52        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.91      0.89       690

   micro avg       0.85      0.92      0.89      1497
   macro avg       0.75      0.82      0.78      1497
weighted avg       0.86      0.92      0.89      1497



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.983, train_acc=0.997, train_loss=0.526, train_precision=0.978, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.98      0.98      0.98       265
         PRO       0.69      0.82      0.75        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.98      0.99      0.99       786
   macro avg       0.83      0.85      0.84       786
weighted avg       0.98      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.48it/s, F1=0.886, eval_acc=0.955, eval_loss=5.78, eval_precision=0.849, eval_recall=0.929]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.95      1.00      0.98       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.79      0.90      0.84       523
         PRO       0.59      0.94      0.72        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.91      0.88       690

   micro avg       0.84      0.92      0.88      1497
   macro avg       0.76      0.85      0.80      1497
weighted avg       0.84      0.92      0.88      1497



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.992, train_acc=0.998, train_loss=0.325, train_precision=0.991, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       0.33      0.50      0.40         2
        NAME       0.99      1.00      0.99        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       0.91      0.94      0.92       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.9, eval_acc=0.953, eval_loss=6.5, eval_precision=0.867, eval_recall=0.935]   


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.80      0.92      0.86       523
         PRO       0.71      0.94      0.81        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:11<00:00,  2.89it/s, F1=0.996, train_acc=0.999, train_loss=0.215, train_precision=0.996, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.901, eval_acc=0.954, eval_loss=6.92, eval_precision=0.87, eval_recall=0.936] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      1.00      0.98       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.82      0.91      0.86       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.90      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.86      0.93      0.90      1497



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.996, train_acc=0.999, train_loss=0.18, train_precision=0.996, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.898, eval_acc=0.956, eval_loss=6.38, eval_precision=0.865, eval_recall=0.934]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.96       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.91      0.86       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=0.997, train_acc=0.999, train_loss=0.145, train_precision=0.996, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.904, eval_acc=0.955, eval_loss=7.02, eval_precision=0.874, eval_recall=0.938]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.83      0.92      0.87       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.90       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.90it/s, F1=0.998, train_acc=1, train_loss=0.114, train_precision=0.998, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.49it/s, F1=0.902, eval_acc=0.956, eval_loss=6.56, eval_precision=0.87, eval_recall=0.936] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.91      0.86       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.78      0.85      0.82      1497
weighted avg       0.86      0.93      0.90      1497



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.90it/s, F1=0.998, train_acc=1, train_loss=0.0946, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.902, eval_acc=0.957, eval_loss=7.02, eval_precision=0.87, eval_recall=0.938] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.92      0.86       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.86      0.93      0.90      1497
   macro avg       0.78      0.85      0.82      1497
weighted avg       0.86      0.93      0.90      1497



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.998, train_acc=1, train_loss=0.104, train_precision=0.998, train_recall=0.998]     


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.907, eval_acc=0.957, eval_loss=7.23, eval_precision=0.875, eval_recall=0.942]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.83      0.93      0.88       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.87      0.98      0.92      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.997, train_acc=1, train_loss=0.077, train_precision=0.996, train_recall=0.999]     


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.899, eval_acc=0.956, eval_loss=7.24, eval_precision=0.865, eval_recall=0.936]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.91      0.86       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.996, train_acc=1, train_loss=0.0786, train_precision=0.995, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.906, eval_acc=0.955, eval_loss=7.69, eval_precision=0.875, eval_recall=0.939]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.82      0.92      0.87       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.90       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.78      0.85      0.81      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.87it/s, F1=0.998, train_acc=1, train_loss=0.0516, train_precision=0.998, train_recall=0.999]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.52it/s, F1=0.896, eval_acc=0.956, eval_loss=7.36, eval_precision=0.86, eval_recall=0.935] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.91      0.86       523
         PRO       0.55      1.00      0.71        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.90       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.76      0.85      0.80      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.999, train_acc=1, train_loss=0.0455, train_precision=0.999, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.51it/s, F1=0.901, eval_acc=0.956, eval_loss=7.66, eval_precision=0.866, eval_recall=0.939]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.92      0.87       523
         PRO       0.60      1.00      0.75        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.90       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.85      0.98      0.90      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.75it/s, F1=0.999, train_acc=1, train_loss=0.0438, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.892, eval_acc=0.957, eval_loss=7.27, eval_precision=0.855, eval_recall=0.934]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.33      0.50      0.40         2
        NAME       0.98      1.00      0.99       110
         ORG       0.80      0.91      0.85       523
         PRO       0.56      1.00      0.72        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.80      0.91      0.85      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=0.999, train_acc=1, train_loss=0.0444, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:05<00:00,  1.52it/s, F1=0.904, eval_acc=0.956, eval_loss=8.06, eval_precision=0.872, eval_recall=0.94] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.82      0.92      0.87       523
         PRO       0.62      1.00      0.77        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.91it/s, F1=0.997, train_acc=1, train_loss=0.0863, train_precision=0.997, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.898, eval_acc=0.958, eval_loss=7.19, eval_precision=0.864, eval_recall=0.936]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.33      0.50      0.40         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.91      0.86       523
         PRO       0.60      1.00      0.75        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.81      0.91      0.85      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.74it/s, F1=1, train_acc=1, train_loss=0.0417, train_precision=0.999, train_recall=1]       


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.892, eval_acc=0.957, eval_loss=7.05, eval_precision=0.854, eval_recall=0.935]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.79      0.91      0.85       523
         PRO       0.58      1.00      0.73        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.84      0.98      0.90      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.90it/s, F1=0.998, train_acc=1, train_loss=0.0432, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.907, eval_acc=0.958, eval_loss=7.34, eval_precision=0.877, eval_recall=0.94] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.92      0.88       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.81it/s, F1=1, train_acc=1, train_loss=0.0275, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.896, eval_acc=0.957, eval_loss=7.48, eval_precision=0.861, eval_recall=0.937]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.91      0.86       523
         PRO       0.58      1.00      0.73        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.85      0.98      0.90      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=1, train_acc=1, train_loss=0.0214, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.55it/s, F1=0.899, eval_acc=0.958, eval_loss=7.52, eval_precision=0.864, eval_recall=0.938]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.92      0.87       523
         PRO       0.56      1.00      0.72        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.85      0.98      0.90      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.997, train_acc=1, train_loss=0.0284, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.902, eval_acc=0.956, eval_loss=8.19, eval_precision=0.868, eval_recall=0.938]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.83      0.92      0.87       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.90it/s, F1=1, train_acc=1, train_loss=0.0209, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.903, eval_acc=0.958, eval_loss=8.05, eval_precision=0.869, eval_recall=0.94] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.82      0.92      0.87       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:08<00:00,  4.00it/s, F1=0.999, train_acc=1, train_loss=0.0239, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.19it/s, F1=0.9, eval_acc=0.958, eval_loss=8.04, eval_precision=0.866, eval_recall=0.938]  


eval_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.83      0.92      0.87       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.92      0.89       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=1, train_acc=1, train_loss=0.0161, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.903, eval_acc=0.958, eval_loss=7.98, eval_precision=0.87, eval_recall=0.94]  


eval_reports:


calculate data/few_shot/resume/train_250.json etag: 100%|██████████| 108k/108k [00:00<00:00, 152MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 196MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 208MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 369kB/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.83      0.92      0.87       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.93      0.89       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.87      0.94      0.90      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_250.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot


count line size data/few_shot/resume/labels.txt: 29L [00:00, 207214.34L/s]
build line mapper: 29L [00:00, 232127.51L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 9695.88it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 273117.47it/s]
load dataset from data/few_shot/resume/train_250.json: 93it [00:00, 927.45it/s]

load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/258a32339a7cddecc92751214f251651_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_250.json: 250it [00:00, 881.39it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 826.72it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_250_pretraind_task/Bert_240/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.82it/s, F1=0, train_acc=0.0695, train_loss=141, train_precision=0, train_recall=0]


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.00      0.00      0.00       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.00      0.00      0.00       353

   micro avg       0.00      0.00      0.00       786
   macro avg       0.00      0.00      0.00       786
weighted avg       0.00      0.00      0.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0, eval_acc=0.293, eval_loss=110, eval_precision=0, eval_recall=0]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.00      0.00      0.00       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.00      0.00      0.00       690

   micro avg       0.00      0.00      0.00      1497
   macro avg       0.00      0.00      0.00      1497
weighted avg       0.00      0.00      0.00      1497



Epoch: 2/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.95it/s, F1=0.0251, train_acc=0.444, train_loss=67.7, train_precision=0.0178, train_recall=0.0436]     


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00        80
         ORG       0.02      0.11      0.03       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.00      0.02      0.01       353

   micro avg       0.01      0.04      0.02       786
   macro avg       0.00      0.02      0.00       786
weighted avg       0.01      0.04      0.01       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.159, eval_acc=0.656, eval_loss=43.9, eval_precision=0.114, eval_recall=0.267]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.22      0.57      0.32       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.04      0.14      0.07       690

   micro avg       0.11      0.27      0.15      1497
   macro avg       0.03      0.09      0.05      1497
weighted avg       0.10      0.27      0.14      1497



Epoch: 3/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.227, train_acc=0.77, train_loss=27.8, train_precision=0.182, train_recall=0.316] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        18
         EDU       0.00      0.00      0.00        48
         LOC       0.00      0.00      0.00         2
        NAME       0.08      0.14      0.10        80
         ORG       0.28      0.57      0.38       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.11      0.25      0.15       353

   micro avg       0.16      0.32      0.21       786
   macro avg       0.06      0.12      0.08       786
weighted avg       0.15      0.32      0.20       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.453, eval_acc=0.837, eval_loss=21.2, eval_precision=0.354, eval_recall=0.634]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.55      0.86      0.67       110
         ORG       0.40      0.76      0.53       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.33      0.64      0.44       690

   micro avg       0.34      0.63      0.44      1497
   macro avg       0.16      0.28      0.20      1497
weighted avg       0.33      0.63      0.43      1497



Epoch: 4/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.86it/s, F1=0.639, train_acc=0.914, train_loss=11.1, train_precision=0.566, train_recall=0.748]


train_reports:
              precision    recall  f1-score   support

        CONT       0.24      0.33      0.28        18
         EDU       0.02      0.04      0.02        48
         LOC       0.00      0.00      0.00         2
        NAME       0.62      0.79      0.69        80
         ORG       0.60      0.85      0.70       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.61      0.83      0.70       353

   micro avg       0.53      0.75      0.62       786
   macro avg       0.26      0.36      0.30       786
weighted avg       0.54      0.75      0.63       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.663, eval_acc=0.915, eval_loss=15.1, eval_precision=0.571, eval_recall=0.794]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.65      0.91      0.76        33
         EDU       0.11      0.25      0.15       106
         LOC       0.00      0.00      0.00         2
        NAME       0.87      1.00      0.93       110
         ORG       0.47      0.74      0.58       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.70      0.90      0.79       690

   micro avg       0.55      0.79      0.65      1497
   macro avg       0.35      0.48      0.40      1497
weighted avg       0.58      0.79      0.66      1497



Epoch: 5/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.88it/s, F1=0.834, train_acc=0.965, train_loss=5.63, train_precision=0.792, train_recall=0.885]


train_reports:
              precision    recall  f1-score   support

        CONT       0.62      1.00      0.77        18
         EDU       0.32      0.58      0.41        48
         LOC       0.00      0.00      0.00         2
        NAME       0.93      0.94      0.93        80
         ORG       0.81      0.90      0.85       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.85      0.95      0.90       353

   micro avg       0.78      0.88      0.83       786
   macro avg       0.44      0.55      0.48       786
weighted avg       0.78      0.88      0.83       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.789, eval_acc=0.945, eval_loss=9.83, eval_precision=0.709, eval_recall=0.895]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.59      0.97      0.74        33
         EDU       0.62      0.86      0.72       106
         LOC       0.00      0.00      0.00         2
        NAME       0.87      1.00      0.93       110
         ORG       0.64      0.88      0.74       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.73      0.92      0.81       690

   micro avg       0.68      0.89      0.77      1497
   macro avg       0.43      0.58      0.49      1497
weighted avg       0.68      0.89      0.77      1497



Epoch: 6/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.66it/s, F1=0.809, train_acc=0.968, train_loss=4.69, train_precision=0.757, train_recall=0.875]


train_reports:
              precision    recall  f1-score   support

        CONT       0.67      1.00      0.80        18
         EDU       0.57      0.79      0.66        48
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99        80
         ORG       0.74      0.88      0.81       265
         PRO       0.00      0.00      0.00        11
        RACE       0.00      0.00      0.00         9
       TITLE       0.80      0.92      0.85       353

   micro avg       0.75      0.88      0.81       786
   macro avg       0.47      0.57      0.51       786
weighted avg       0.76      0.88      0.81       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.816, eval_acc=0.933, eval_loss=14.2, eval_precision=0.748, eval_recall=0.901]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.78      0.97      0.86        33
         EDU       0.62      0.88      0.73       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      0.99      0.99       110
         ORG       0.71      0.88      0.78       523
         PRO       0.00      0.00      0.00        18
        RACE       0.65      0.73      0.69        15
       TITLE       0.77      0.91      0.83       690

   micro avg       0.73      0.89      0.80      1497
   macro avg       0.56      0.67      0.61      1497
weighted avg       0.74      0.89      0.81      1497



Epoch: 7/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.898, train_acc=0.983, train_loss=2.61, train_precision=0.869, train_recall=0.934]


train_reports:
              precision    recall  f1-score   support

        CONT       0.78      1.00      0.88        18
         EDU       0.69      0.88      0.77        48
         LOC       0.00      0.00      0.00         2
        NAME       0.94      0.93      0.93        80
         ORG       0.88      0.95      0.92       265
         PRO       0.00      0.00      0.00        11
        RACE       0.50      0.67      0.57         9
       TITLE       0.90      0.96      0.93       353

   micro avg       0.85      0.93      0.89       786
   macro avg       0.59      0.67      0.62       786
weighted avg       0.86      0.93      0.89       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.828, eval_acc=0.943, eval_loss=12.4, eval_precision=0.766, eval_recall=0.904]


eval_reports:
              precision    recall  f1-score   support

        CONT       0.86      0.97      0.91        33
         EDU       0.74      0.92      0.82       106
         LOC       0.00      0.00      0.00         2
        NAME       0.95      1.00      0.97       110
         ORG       0.71      0.87      0.78       523
         PRO       0.06      0.17      0.09        18
        RACE       0.82      0.93      0.87        15
       TITLE       0.79      0.92      0.85       690

   micro avg       0.75      0.90      0.82      1497
   macro avg       0.62      0.72      0.66      1497
weighted avg       0.76      0.90      0.83      1497



Epoch: 8/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.95it/s, F1=0.961, train_acc=0.993, train_loss=1.2, train_precision=0.952, train_recall=0.971] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.90      1.00      0.95        18
         EDU       0.89      0.98      0.93        48
         LOC       0.00      0.00      0.00         2
        NAME       0.99      0.96      0.97        80
         ORG       0.94      0.97      0.96       265
         PRO       0.47      0.64      0.54        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      0.99      0.99       353

   micro avg       0.95      0.97      0.96       786
   macro avg       0.77      0.82      0.79       786
weighted avg       0.95      0.97      0.96       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.859, eval_acc=0.953, eval_loss=9.84, eval_precision=0.812, eval_recall=0.915]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.85      0.92      0.89       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.74      0.89      0.81       523
         PRO       0.25      0.56      0.34        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.80      0.90      0.85       690

   micro avg       0.78      0.91      0.84      1497
   macro avg       0.68      0.78      0.72      1497
weighted avg       0.79      0.91      0.84      1497



Epoch: 9/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.99it/s, F1=0.96, train_acc=0.993, train_loss=1.15, train_precision=0.948, train_recall=0.973] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.90      1.00      0.95        18
         EDU       0.94      0.98      0.96        48
         LOC       0.00      0.00      0.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.93      0.97      0.95       265
         PRO       0.69      0.82      0.75        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.97      0.98      0.98       353

   micro avg       0.95      0.97      0.96       786
   macro avg       0.80      0.84      0.82       786
weighted avg       0.95      0.97      0.96       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.861, eval_acc=0.948, eval_loss=11.9, eval_precision=0.809, eval_recall=0.922]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.97      0.94        33
         EDU       0.89      0.96      0.93       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.75      0.89      0.81       523
         PRO       0.48      0.89      0.63        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.79      0.91      0.84       690

   micro avg       0.79      0.91      0.85      1497
   macro avg       0.71      0.83      0.76      1497
weighted avg       0.79      0.91      0.85      1497



Epoch: 10/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.87it/s, F1=0.981, train_acc=0.997, train_loss=0.5, train_precision=0.973, train_recall=0.99]   


train_reports:
              precision    recall  f1-score   support

        CONT       0.90      1.00      0.95        18
         EDU       0.96      0.98      0.97        48
         LOC       0.00      0.00      0.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.97      0.99      0.98       265
         PRO       0.92      1.00      0.96        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      0.99       353

   micro avg       0.98      0.99      0.98       786
   macro avg       0.84      0.87      0.86       786
weighted avg       0.98      0.99      0.98       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.869, eval_acc=0.956, eval_loss=10.2, eval_precision=0.821, eval_recall=0.925]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.90      0.97      0.93       106
         LOC       0.33      0.50      0.40         2
        NAME       0.96      1.00      0.98       110
         ORG       0.73      0.88      0.80       523
         PRO       0.43      0.89      0.58        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.83      0.93      0.87       690

   micro avg       0.80      0.92      0.86      1497
   macro avg       0.75      0.89      0.81      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 11/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.988, train_acc=0.998, train_loss=0.353, train_precision=0.985, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       0.94      0.98      0.96        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.97      0.98      0.97       265
         PRO       0.92      1.00      0.96        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.98      0.99      0.99       786
   macro avg       0.98      1.00      0.99       786
weighted avg       0.98      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.878, eval_acc=0.955, eval_loss=10.8, eval_precision=0.833, eval_recall=0.93] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.90      0.95      0.93       106
         LOC       0.33      0.50      0.40         2
        NAME       0.97      1.00      0.99       110
         ORG       0.75      0.89      0.82       523
         PRO       0.50      0.83      0.62        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.83      0.93      0.88       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.76      0.88      0.82      1497
weighted avg       0.82      0.92      0.87      1497



Epoch: 12/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.85it/s, F1=0.994, train_acc=0.999, train_loss=0.24, train_precision=0.993, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       0.96      0.98      0.97        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       0.99      1.00      0.99       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.87, eval_acc=0.955, eval_loss=10.9, eval_precision=0.824, eval_recall=0.923] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.97      0.94       106
         LOC       0.67      1.00      0.80         2
        NAME       0.96      0.99      0.97       110
         ORG       0.74      0.88      0.80       523
         PRO       0.46      0.94      0.62        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.83      0.92      0.88       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.80      0.96      0.86      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 13/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.92it/s, F1=0.994, train_acc=0.999, train_loss=0.22, train_precision=0.991, train_recall=0.997] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      0.99        80
         ORG       0.98      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       0.99      1.00      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.876, eval_acc=0.957, eval_loss=10.4, eval_precision=0.833, eval_recall=0.926]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.97      0.94       106
         LOC       0.50      1.00      0.67         2
        NAME       0.96      0.99      0.98       110
         ORG       0.75      0.89      0.81       523
         PRO       0.55      0.94      0.69        18
        RACE       0.83      1.00      0.91        15
       TITLE       0.83      0.91      0.87       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.78      0.96      0.85      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 14/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=0.995, train_acc=0.999, train_loss=0.144, train_precision=0.993, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      0.99      0.99       353

   micro avg       0.99      1.00      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.35it/s, F1=0.879, eval_acc=0.957, eval_loss=10.7, eval_precision=0.837, eval_recall=0.927]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.89      0.97      0.93       106
         LOC       0.50      1.00      0.67         2
        NAME       0.97      0.99      0.98       110
         ORG       0.76      0.89      0.82       523
         PRO       0.53      0.94      0.68        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.84      0.92      0.88       690

   micro avg       0.82      0.92      0.87      1497
   macro avg       0.79      0.96      0.86      1497
weighted avg       0.83      0.92      0.87      1497



Epoch: 15/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.94it/s, F1=0.978, train_acc=0.997, train_loss=0.425, train_precision=0.97, train_recall=0.987] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.96      0.99      0.97       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.97      0.99      0.98       353

   micro avg       0.97      0.99      0.98       786
   macro avg       0.99      1.00      0.99       786
weighted avg       0.97      0.99      0.98       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.871, eval_acc=0.954, eval_loss=11.6, eval_precision=0.827, eval_recall=0.922]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.97      0.94       106
         LOC       0.67      1.00      0.80         2
        NAME       0.96      1.00      0.98       110
         ORG       0.76      0.88      0.81       523
         PRO       0.51      1.00      0.68        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.81      0.92      0.86       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.81      0.97      0.87      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 16/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.96it/s, F1=0.975, train_acc=0.996, train_loss=0.567, train_precision=0.967, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.92      0.96      0.94       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.97      0.99      0.98       353

   micro avg       0.96      0.98      0.97       786
   macro avg       0.99      0.99      0.99       786
weighted avg       0.96      0.98      0.97       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.863, eval_acc=0.95, eval_loss=11.5, eval_precision=0.813, eval_recall=0.921] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.93      0.97      0.95       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.74      0.91      0.82       523
         PRO       0.55      0.94      0.69        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.80      0.90      0.85       690

   micro avg       0.80      0.92      0.85      1497
   macro avg       0.73      0.84      0.77      1497
weighted avg       0.80      0.92      0.85      1497



Epoch: 17/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.82it/s, F1=0.99, train_acc=0.999, train_loss=0.287, train_precision=0.986, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.97      0.98      0.98       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      0.99       353

   micro avg       0.99      0.99      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.871, eval_acc=0.955, eval_loss=10.9, eval_precision=0.82, eval_recall=0.93] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.92      0.97      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.74      0.89      0.81       523
         PRO       0.53      1.00      0.69        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.81      0.92      0.86       690

   micro avg       0.80      0.92      0.86      1497
   macro avg       0.85      0.97      0.90      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 18/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.86it/s, F1=0.985, train_acc=0.998, train_loss=0.294, train_precision=0.984, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       0.99      0.99      0.99        80
         ORG       0.98      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.869, eval_acc=0.957, eval_loss=10.3, eval_precision=0.819, eval_recall=0.929]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.90      0.97      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.71      0.89      0.79       523
         PRO       0.64      1.00      0.78        18
        RACE       0.83      1.00      0.91        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.79      0.92      0.85      1497
   macro avg       0.85      0.97      0.90      1497
weighted avg       0.80      0.92      0.86      1497



Epoch: 19/30 Train: 100%|██████████| 32/32 [00:07<00:00,  4.01it/s, F1=0.995, train_acc=0.999, train_loss=0.114, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.874, eval_acc=0.957, eval_loss=10.4, eval_precision=0.824, eval_recall=0.934]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.97      0.94       106
         LOC       0.67      1.00      0.80         2
        NAME       0.96      1.00      0.98       110
         ORG       0.73      0.90      0.81       523
         PRO       0.62      1.00      0.77        18
        RACE       0.83      1.00      0.91        15
       TITLE       0.81      0.92      0.87       690

   micro avg       0.80      0.93      0.86      1497
   macro avg       0.81      0.97      0.88      1497
weighted avg       0.80      0.93      0.86      1497



Epoch: 20/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=0.996, train_acc=0.999, train_loss=0.0938, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.98      0.99      0.98       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      1.00      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.869, eval_acc=0.954, eval_loss=11.8, eval_precision=0.817, eval_recall=0.93] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       0.50      0.50      0.50         2
        NAME       0.96      1.00      0.98       110
         ORG       0.75      0.90      0.82       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.79      0.92      0.85       690

   micro avg       0.80      0.92      0.86      1497
   macro avg       0.81      0.91      0.86      1497
weighted avg       0.80      0.92      0.86      1497



Epoch: 21/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.96it/s, F1=0.998, train_acc=1, train_loss=0.0907, train_precision=0.998, train_recall=0.998]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.47it/s, F1=0.88, eval_acc=0.959, eval_loss=9.65, eval_precision=0.836, eval_recall=0.93]  


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.93      0.97      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.95      1.00      0.97       110
         ORG       0.75      0.90      0.82       523
         PRO       0.64      1.00      0.78        18
        RACE       0.82      0.93      0.87        15
       TITLE       0.83      0.91      0.87       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.86      0.96      0.90      1497
weighted avg       0.82      0.92      0.86      1497



Epoch: 22/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.85it/s, F1=0.991, train_acc=0.999, train_loss=0.0805, train_precision=0.989, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      0.99      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      0.99      0.99       353

   micro avg       0.99      0.99      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.55it/s, F1=0.883, eval_acc=0.958, eval_loss=10.9, eval_precision=0.839, eval_recall=0.933]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.97      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.76      0.90      0.82       523
         PRO       0.62      1.00      0.77        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.81      0.93      0.87      1497
   macro avg       0.86      0.97      0.91      1497
weighted avg       0.82      0.93      0.87      1497



Epoch: 23/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.93it/s, F1=1, train_acc=1, train_loss=0.045, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.882, eval_acc=0.956, eval_loss=11.8, eval_precision=0.838, eval_recall=0.931]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.97      0.94       106
         LOC       0.50      0.50      0.50         2
        NAME       0.97      1.00      0.99       110
         ORG       0.77      0.91      0.83       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.82      0.91      0.86       690

   micro avg       0.82      0.92      0.87      1497
   macro avg       0.82      0.91      0.86      1497
weighted avg       0.82      0.92      0.87      1497



Epoch: 24/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.84it/s, F1=0.996, train_acc=0.999, train_loss=0.109, train_precision=0.996, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      0.99      0.99       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.74it/s, F1=0.874, eval_acc=0.954, eval_loss=11.4, eval_precision=0.826, eval_recall=0.93] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.93      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.95      1.00      0.97       110
         ORG       0.75      0.89      0.82       523
         PRO       0.53      1.00      0.69        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.86      0.97      0.90      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 25/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.85it/s, F1=1, train_acc=1, train_loss=0.0376, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.867, eval_acc=0.954, eval_loss=11.5, eval_precision=0.816, eval_recall=0.928]


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.91      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.73      0.90      0.81       523
         PRO       0.55      1.00      0.71        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.81      0.91      0.86       690

   micro avg       0.80      0.92      0.86      1497
   macro avg       0.85      0.97      0.90      1497
weighted avg       0.80      0.92      0.86      1497



Epoch: 26/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.94it/s, F1=0.999, train_acc=1, train_loss=0.0433, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.872, eval_acc=0.95, eval_loss=13, eval_precision=0.825, eval_recall=0.926]   


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.90      0.98      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.76      0.89      0.82       523
         PRO       0.49      1.00      0.65        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.81      0.92      0.86      1497
   macro avg       0.85      0.97      0.90      1497
weighted avg       0.82      0.92      0.87      1497



Epoch: 27/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.89it/s, F1=0.997, train_acc=1, train_loss=0.0956, train_precision=0.995, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.99      1.00      0.99       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       0.99      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.853, eval_acc=0.944, eval_loss=15.6, eval_precision=0.805, eval_recall=0.91] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.94      0.98      0.96       106
         LOC       0.50      0.50      0.50         2
        NAME       0.98      1.00      0.99       110
         ORG       0.73      0.90      0.80       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.78      0.88      0.83       690

   micro avg       0.79      0.90      0.84      1497
   macro avg       0.81      0.90      0.85      1497
weighted avg       0.79      0.90      0.84      1497



Epoch: 28/30 Train: 100%|██████████| 32/32 [00:11<00:00,  2.74it/s, F1=0.962, train_acc=0.995, train_loss=1.04, train_precision=0.947, train_recall=0.98]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       0.96      0.98      0.97        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       0.93      0.98      0.95       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.93      0.98      0.95       353

   micro avg       0.94      0.98      0.96       786
   macro avg       0.98      0.99      0.98       786
weighted avg       0.94      0.98      0.96       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.88, eval_acc=0.948, eval_loss=14.1, eval_precision=0.834, eval_recall=0.933] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.97      0.94        33
         EDU       0.91      0.96      0.94       106
         LOC       0.00      0.00      0.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.74      0.91      0.82       523
         PRO       0.57      0.94      0.71        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.83      0.92      0.87       690

   micro avg       0.81      0.93      0.86      1497
   macro avg       0.74      0.84      0.78      1497
weighted avg       0.82      0.93      0.87      1497



Epoch: 29/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.90it/s, F1=0.992, train_acc=0.998, train_loss=0.426, train_precision=0.99, train_recall=0.993]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      0.99      0.99        80
         ORG       0.98      0.99      0.98       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       1.00      1.00      1.00       353

   micro avg       0.99      0.99      0.99       786
   macro avg       1.00      1.00      1.00       786
weighted avg       0.99      0.99      0.99       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.88, eval_acc=0.956, eval_loss=10.9, eval_precision=0.833, eval_recall=0.936] 


eval_reports:


  0%|          | 0/32 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      1.00      0.97        33
         EDU       0.86      0.97      0.91       106
         LOC       0.33      1.00      0.50         2
        NAME       0.89      1.00      0.94       110
         ORG       0.78      0.92      0.85       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.82      0.91      0.86       690

   micro avg       0.81      0.93      0.87      1497
   macro avg       0.76      0.98      0.84      1497
weighted avg       0.81      0.93      0.87      1497



Epoch: 30/30 Train: 100%|██████████| 32/32 [00:08<00:00,  3.97it/s, F1=0.997, train_acc=1, train_loss=0.0694, train_precision=0.996, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        18
         EDU       1.00      1.00      1.00        48
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00        80
         ORG       1.00      1.00      1.00       265
         PRO       1.00      1.00      1.00        11
        RACE       1.00      1.00      1.00         9
       TITLE       0.99      1.00      1.00       353

   micro avg       1.00      1.00      1.00       786
   macro avg       1.00      1.00      1.00       786
weighted avg       1.00      1.00      1.00       786



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.887, eval_acc=0.956, eval_loss=11.7, eval_precision=0.839, eval_recall=0.945]


eval_reports:


calculate data/few_shot/resume/train_500.json etag: 100%|██████████| 226k/226k [00:00<00:00, 212MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 208MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 219MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 364kB/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.90      0.98      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.77      0.94      0.85       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.81      0.92      0.86       690

   micro avg       0.81      0.94      0.87      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.82      0.94      0.87      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_500.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot


count line size data/few_shot/resume/labels.txt: 29L [00:00, 237104.90L/s]
build line mapper: 29L [00:00, 245231.48L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8603.40it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 274393.72it/s]
load dataset from data/few_shot/resume/train_500.json: 0it [00:00, ?it/s]

load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_500.json: 500it [00:00, 823.48it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 823.19it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.77it/s, F1=0.032, train_acc=0.349, train_loss=78.3, train_precision=0.0268, train_recall=0.0412]    


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        35
         EDU       0.00      0.00      0.00        99
         LOC       0.00      0.00      0.00         7
        NAME       0.00      0.00      0.00       148
         ORG       0.07      0.11      0.09       547
         PRO       0.00      0.00      0.00        37
        RACE       0.00      0.00      0.00        16
       TITLE       0.01      0.01      0.01       702

   micro avg       0.01      0.04      0.02      1591
   macro avg       0.01      0.02      0.01      1591
weighted avg       0.03      0.04      0.04      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.42it/s, F1=0.217, eval_acc=0.679, eval_loss=32.9, eval_precision=0.18, eval_recall=0.273] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.29      0.62      0.40       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.07      0.12      0.09       690

   micro avg       0.18      0.28      0.22      1497
   macro avg       0.05      0.09      0.06      1497
weighted avg       0.13      0.28      0.18      1497



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.78it/s, F1=0.47, train_acc=0.853, train_loss=18.1, train_precision=0.413, train_recall=0.553] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.27      0.11      0.16        35
         EDU       0.02      0.04      0.02        99
         LOC       0.00      0.00      0.00         7
        NAME       0.02      0.03      0.02       148
         ORG       0.50      0.71      0.58       547
         PRO       0.00      0.00      0.00        37
        RACE       0.00      0.00      0.00        16
       TITLE       0.53      0.71      0.60       702

   micro avg       0.40      0.57      0.47      1591
   macro avg       0.17      0.20      0.17      1591
weighted avg       0.41      0.57      0.47      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.732, eval_acc=0.93, eval_loss=8.39, eval_precision=0.666, eval_recall=0.814] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.24      0.24      0.24        33
         EDU       0.41      0.70      0.51       106
         LOC       0.00      0.00      0.00         2
        NAME       0.16      0.27      0.20       110
         ORG       0.73      0.89      0.80       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.81      0.91      0.86       690

   micro avg       0.64      0.81      0.72      1497
   macro avg       0.29      0.38      0.33      1497
weighted avg       0.67      0.81      0.73      1497



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.784, train_acc=0.959, train_loss=5.27, train_precision=0.736, train_recall=0.846]


train_reports:
              precision    recall  f1-score   support

        CONT       0.66      0.77      0.71        35
         EDU       0.43      0.70      0.53        99
         LOC       0.00      0.00      0.00         7
        NAME       0.53      0.70      0.60       148
         ORG       0.76      0.90      0.83       547
         PRO       0.06      0.11      0.08        37
        RACE       0.33      0.06      0.11        16
       TITLE       0.88      0.94      0.91       702

   micro avg       0.73      0.85      0.78      1591
   macro avg       0.46      0.52      0.47      1591
weighted avg       0.75      0.85      0.79      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.852, eval_acc=0.95, eval_loss=6.79, eval_precision=0.799, eval_recall=0.917] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.82      1.00      0.90        33
         EDU       0.73      0.78      0.75       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      0.99      0.99       110
         ORG       0.74      0.90      0.81       523
         PRO       0.27      0.83      0.41        18
        RACE       0.50      0.47      0.48        15
       TITLE       0.83      0.94      0.88       690

   micro avg       0.78      0.91      0.84      1497
   macro avg       0.61      0.74      0.65      1497
weighted avg       0.79      0.91      0.85      1497



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.93it/s, F1=0.913, train_acc=0.981, train_loss=2.86, train_precision=0.89, train_recall=0.94]  


train_reports:
              precision    recall  f1-score   support

        CONT       0.78      1.00      0.88        35
         EDU       0.89      0.94      0.91        99
         LOC       0.11      0.14      0.12         7
        NAME       0.95      0.96      0.95       148
         ORG       0.85      0.93      0.89       547
         PRO       0.53      0.70      0.60        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.92      0.95      0.94       702

   micro avg       0.88      0.93      0.90      1591
   macro avg       0.74      0.82      0.78      1591
weighted avg       0.88      0.93      0.91      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.43it/s, F1=0.86, eval_acc=0.954, eval_loss=6.07, eval_precision=0.81, eval_recall=0.921]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.88      0.99      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      0.99      0.99       110
         ORG       0.74      0.88      0.81       523
         PRO       0.51      1.00      0.68        18
        RACE       0.83      1.00      0.91        15
       TITLE       0.79      0.92      0.85       690

   micro avg       0.79      0.92      0.85      1497
   macro avg       0.84      0.97      0.90      1497
weighted avg       0.80      0.92      0.85      1497



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.87it/s, F1=0.941, train_acc=0.989, train_loss=1.89, train_precision=0.923, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        35
         EDU       0.99      0.99      0.99        99
         LOC       0.71      0.71      0.71         7
        NAME       0.99      1.00      1.00       148
         ORG       0.89      0.95      0.92       547
         PRO       0.74      0.86      0.80        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.93      0.97      0.95       702

   micro avg       0.92      0.96      0.94      1591
   macro avg       0.88      0.92      0.90      1591
weighted avg       0.92      0.96      0.94      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.89, eval_acc=0.954, eval_loss=7.12, eval_precision=0.847, eval_recall=0.938] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      0.94      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.78      0.93      0.85       523
         PRO       0.36      0.67      0.47        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.84      0.92      0.88       690

   micro avg       0.83      0.93      0.88      1497
   macro avg       0.84      0.93      0.88      1497
weighted avg       0.83      0.93      0.88      1497



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.79it/s, F1=0.935, train_acc=0.988, train_loss=1.66, train_precision=0.913, train_recall=0.961]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.93      0.96      0.95        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      0.99       148
         ORG       0.90      0.96      0.93       547
         PRO       0.83      0.92      0.87        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.91      0.96      0.93       702

   micro avg       0.91      0.96      0.94      1591
   macro avg       0.93      0.96      0.94      1591
weighted avg       0.91      0.96      0.94      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.893, eval_acc=0.965, eval_loss=5.01, eval_precision=0.859, eval_recall=0.931]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.80      0.91      0.85       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.83      0.92      0.87       690

   micro avg       0.84      0.93      0.88      1497
   macro avg       0.89      0.97      0.93      1497
weighted avg       0.84      0.93      0.88      1497



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.97, train_acc=0.994, train_loss=0.849, train_precision=0.964, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.94      0.97      0.96       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.96      0.98      0.97       702

   micro avg       0.96      0.98      0.97      1591
   macro avg       0.97      0.98      0.98      1591
weighted avg       0.96      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.905, eval_acc=0.964, eval_loss=6.06, eval_precision=0.886, eval_recall=0.926]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.89      0.87       523
         PRO       0.82      1.00      0.90        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.87      0.92      0.90      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.87      0.92      0.90      1497



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.80it/s, F1=0.982, train_acc=0.996, train_loss=0.736, train_precision=0.976, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.97      0.99      0.98       547
         PRO       0.97      0.97      0.97        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.98      0.99      0.98       702

   micro avg       0.98      0.99      0.98      1591
   macro avg       0.98      0.99      0.98      1591
weighted avg       0.98      0.99      0.98      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.44it/s, F1=0.892, eval_acc=0.964, eval_loss=5.55, eval_precision=0.858, eval_recall=0.929]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.93      0.98      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.80      0.88      0.84       523
         PRO       0.64      1.00      0.78        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.85      0.93      0.89       690

   micro avg       0.85      0.92      0.88      1497
   macro avg       0.88      0.96      0.92      1497
weighted avg       0.85      0.92      0.89      1497



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.16it/s, F1=0.979, train_acc=0.996, train_loss=0.538, train_precision=0.972, train_recall=0.986]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.98      0.99      0.98        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.95      0.98      0.97       547
         PRO       0.92      0.97      0.95        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.97      0.99      0.98       702

   micro avg       0.97      0.98      0.98      1591
   macro avg       0.96      0.98      0.97      1591
weighted avg       0.97      0.98      0.98      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.904, eval_acc=0.963, eval_loss=5.91, eval_precision=0.877, eval_recall=0.934]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      0.99      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.85      0.90      0.87       523
         PRO       0.65      0.94      0.77        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.89      0.96      0.92      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.79it/s, F1=0.991, train_acc=0.999, train_loss=0.284, train_precision=0.989, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.97      0.99      0.98        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.98      0.99      0.98       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       0.98      0.99      0.98      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.908, eval_acc=0.965, eval_loss=5.42, eval_precision=0.881, eval_recall=0.938]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.91      0.88       523
         PRO       0.64      1.00      0.78        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.93      0.90      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.88      0.93      0.91      1497



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.87it/s, F1=0.993, train_acc=0.998, train_loss=0.204, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.98      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.901, eval_acc=0.961, eval_loss=6.66, eval_precision=0.876, eval_recall=0.929]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.89      0.86       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.85      0.93      0.89       690

   micro avg       0.86      0.92      0.89      1497
   macro avg       0.90      0.96      0.93      1497
weighted avg       0.87      0.92      0.89      1497



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.995, train_acc=0.999, train_loss=0.199, train_precision=0.994, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      0.99      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.32it/s, F1=0.91, eval_acc=0.966, eval_loss=6.03, eval_precision=0.88, eval_recall=0.942]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.91      0.88       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.94      0.91       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.996, train_acc=1, train_loss=0.0882, train_precision=0.995, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.99      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       0.99      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.22it/s, F1=0.916, eval_acc=0.964, eval_loss=6.61, eval_precision=0.898, eval_recall=0.935]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.90      0.89       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.89      0.93      0.91      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.89      0.93      0.91      1497



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=0.996, train_acc=0.999, train_loss=0.108, train_precision=0.996, train_recall=0.997] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       1.00      0.99      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.32it/s, F1=0.907, eval_acc=0.962, eval_loss=6.68, eval_precision=0.883, eval_recall=0.934]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.90      0.87       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.89it/s, F1=0.997, train_acc=1, train_loss=0.0623, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       0.97      1.00      0.99        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.912, eval_acc=0.964, eval_loss=6.65, eval_precision=0.886, eval_recall=0.941]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.92      0.88       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.91      0.97      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.17it/s, F1=0.996, train_acc=0.999, train_loss=0.0641, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       0.99      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.915, eval_acc=0.963, eval_loss=6.85, eval_precision=0.892, eval_recall=0.94] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.91      0.89       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.999, train_acc=1, train_loss=0.0278, train_precision=0.999, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.91, eval_acc=0.963, eval_loss=6.95, eval_precision=0.883, eval_recall=0.94]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.92      0.88       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.89it/s, F1=0.999, train_acc=1, train_loss=0.0268, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.914, eval_acc=0.964, eval_loss=6.98, eval_precision=0.89, eval_recall=0.941] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.91      0.88       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.94      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.79it/s, F1=1, train_acc=1, train_loss=0.0179, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.912, eval_acc=0.963, eval_loss=7.17, eval_precision=0.887, eval_recall=0.94] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.91      0.88       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.998, train_acc=1, train_loss=0.0619, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.92, eval_acc=0.965, eval_loss=6.9, eval_precision=0.894, eval_recall=0.949]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.95      0.91       690

   micro avg       0.88      0.95      0.91      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.89      0.95      0.91      1497



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=0.999, train_acc=1, train_loss=0.0195, train_precision=0.999, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.926, eval_acc=0.967, eval_loss=6.62, eval_precision=0.901, eval_recall=0.953]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=1, train_acc=1, train_loss=0.0142, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.924, eval_acc=0.965, eval_loss=6.98, eval_precision=0.901, eval_recall=0.949]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.87      0.92      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.95      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=1, train_acc=1, train_loss=0.0123, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.44it/s, F1=0.929, eval_acc=0.965, eval_loss=7.05, eval_precision=0.908, eval_recall=0.952]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=1, train_acc=1, train_loss=0.00918, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.928, eval_acc=0.966, eval_loss=6.96, eval_precision=0.908, eval_recall=0.95] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.88it/s, F1=1, train_acc=1, train_loss=0.00862, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.924, eval_acc=0.965, eval_loss=7.15, eval_precision=0.903, eval_recall=0.948]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.92      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.95      0.91       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.80it/s, F1=1, train_acc=1, train_loss=0.00868, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.50it/s, F1=0.927, eval_acc=0.965, eval_loss=7.22, eval_precision=0.906, eval_recall=0.95] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.92      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.80it/s, F1=1, train_acc=1, train_loss=0.00659, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.93, eval_acc=0.966, eval_loss=7.24, eval_precision=0.909, eval_recall=0.952] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.93      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.90      0.95      0.93      1497



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.30it/s, F1=1, train_acc=1, train_loss=0.0106, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.928, eval_acc=0.965, eval_loss=7.28, eval_precision=0.907, eval_recall=0.949]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=1, train_acc=1, train_loss=0.00737, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.923, eval_acc=0.964, eval_loss=7.59, eval_precision=0.899, eval_recall=0.949]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=1, train_acc=1, train_loss=0.0122, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.921, eval_acc=0.965, eval_loss=7.27, eval_precision=0.898, eval_recall=0.946]


eval_reports:


calculate data/few_shot/resume/train_500.json etag: 100%|██████████| 226k/226k [00:00<00:00, 202MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 219MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 221MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 309kB/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.75      1.00      0.86        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.88      0.95      0.91       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.89      0.94      0.92      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_500.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot


count line size data/few_shot/resume/labels.txt: 29L [00:00, 232127.51L/s]
build line mapper: 29L [00:00, 240385.01L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8635.16it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 263911.26it/s]
load dataset from data/few_shot/resume/train_500.json: 93it [00:00, 929.12it/s]

load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_500.json: 500it [00:00, 829.51it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 823.14it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.0313, train_acc=0.394, train_loss=79.5, train_precision=0.031, train_recall=0.0361]     


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        35
         EDU       0.00      0.00      0.00        99
         LOC       0.00      0.00      0.00         7
        NAME       0.00      0.01      0.00       148
         ORG       0.07      0.08      0.07       547
         PRO       0.00      0.00      0.00        37
        RACE       0.00      0.06      0.01        16
       TITLE       0.03      0.02      0.03       702

   micro avg       0.02      0.04      0.03      1591
   macro avg       0.01      0.02      0.01      1591
weighted avg       0.04      0.04      0.04      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.191, eval_acc=0.738, eval_loss=34, eval_precision=0.156, eval_recall=0.249]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.29      0.44      0.35       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.08      0.20      0.12       690

   micro avg       0.15      0.25      0.19      1497
   macro avg       0.05      0.08      0.06      1497
weighted avg       0.14      0.25      0.18      1497



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.397, train_acc=0.835, train_loss=19.1, train_precision=0.346, train_recall=0.476]


train_reports:
              precision    recall  f1-score   support

        CONT       0.03      0.03      0.03        35
         EDU       0.13      0.16      0.14        99
         LOC       0.00      0.00      0.00         7
        NAME       0.13      0.16      0.14       148
         ORG       0.49      0.67      0.56       547
         PRO       0.00      0.00      0.00        37
        RACE       0.00      0.00      0.00        16
       TITLE       0.28      0.52      0.37       702

   micro avg       0.32      0.48      0.39      1591
   macro avg       0.13      0.19      0.16      1591
weighted avg       0.31      0.48      0.38      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.754, eval_acc=0.925, eval_loss=9.47, eval_precision=0.685, eval_recall=0.842]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.25      0.36      0.30        33
         EDU       0.77      0.85      0.81       106
         LOC       0.00      0.00      0.00         2
        NAME       0.76      0.89      0.82       110
         ORG       0.71      0.86      0.78       523
         PRO       0.08      0.11      0.10        18
        RACE       1.00      0.07      0.12        15
       TITLE       0.63      0.86      0.73       690

   micro avg       0.65      0.83      0.73      1497
   macro avg       0.53      0.50      0.46      1497
weighted avg       0.67      0.83      0.73      1497



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.93it/s, F1=0.831, train_acc=0.959, train_loss=5.91, train_precision=0.789, train_recall=0.883]


train_reports:
              precision    recall  f1-score   support

        CONT       0.69      0.94      0.80        35
         EDU       0.79      0.85      0.82        99
         LOC       0.00      0.00      0.00         7
        NAME       0.89      0.95      0.92       148
         ORG       0.73      0.87      0.80       547
         PRO       0.28      0.35      0.31        37
        RACE       0.80      0.25      0.38        16
       TITLE       0.80      0.91      0.85       702

   micro avg       0.76      0.87      0.81      1591
   macro avg       0.62      0.64      0.61      1591
weighted avg       0.77      0.87      0.81      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.866, eval_acc=0.951, eval_loss=6.56, eval_precision=0.82, eval_recall=0.921] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.85      0.90      0.87       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      0.99      0.99       110
         ORG       0.74      0.89      0.81       523
         PRO       0.47      1.00      0.64        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.83      0.93      0.87       690

   micro avg       0.80      0.92      0.85      1497
   macro avg       0.72      0.83      0.76      1497
weighted avg       0.81      0.92      0.86      1497



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=0.909, train_acc=0.979, train_loss=2.91, train_precision=0.882, train_recall=0.941]


train_reports:
              precision    recall  f1-score   support

        CONT       0.92      0.97      0.94        35
         EDU       0.91      0.92      0.91        99
         LOC       0.00      0.00      0.00         7
        NAME       0.99      0.98      0.98       148
         ORG       0.84      0.93      0.88       547
         PRO       0.52      0.68      0.59        37
        RACE       0.83      0.94      0.88        16
       TITLE       0.90      0.96      0.93       702

   micro avg       0.87      0.94      0.90      1591
   macro avg       0.74      0.80      0.77      1591
weighted avg       0.87      0.94      0.90      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.49it/s, F1=0.859, eval_acc=0.959, eval_loss=5.01, eval_precision=0.808, eval_recall=0.921]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.97      0.94       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.73      0.86      0.79       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.79      0.93      0.85       690

   micro avg       0.79      0.91      0.85      1497
   macro avg       0.75      0.84      0.79      1497
weighted avg       0.79      0.91      0.85      1497



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.89it/s, F1=0.947, train_acc=0.989, train_loss=1.54, train_precision=0.93, train_recall=0.967] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.93      0.96      0.95        99
         LOC       0.14      0.14      0.14         7
        NAME       0.99      0.99      0.99       148
         ORG       0.91      0.96      0.93       547
         PRO       0.73      0.86      0.79        37
        RACE       0.79      0.94      0.86        16
       TITLE       0.94      0.97      0.96       702

   micro avg       0.92      0.96      0.94      1591
   macro avg       0.80      0.85      0.83      1591
weighted avg       0.92      0.96      0.94      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.881, eval_acc=0.957, eval_loss=5.93, eval_precision=0.848, eval_recall=0.919]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.94      0.95      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.79      0.87      0.83       523
         PRO       0.67      1.00      0.80        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.83      0.92      0.87      1497
   macro avg       0.90      0.96      0.92      1497
weighted avg       0.83      0.92      0.87      1497



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.23it/s, F1=0.971, train_acc=0.996, train_loss=0.825, train_precision=0.964, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.99      1.00      0.99        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      0.99      0.99       148
         ORG       0.95      0.97      0.96       547
         PRO       0.87      0.92      0.89        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.96      0.98      0.97       702

   micro avg       0.96      0.98      0.97      1591
   macro avg       0.96      0.98      0.97      1591
weighted avg       0.96      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.902, eval_acc=0.963, eval_loss=5.5, eval_precision=0.874, eval_recall=0.934] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.89      0.85       523
         PRO       0.78      1.00      0.88        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.85      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.91      0.96      0.94      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.88it/s, F1=0.976, train_acc=0.996, train_loss=0.736, train_precision=0.97, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.96      0.98      0.97       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.96      0.98      0.97       702

   micro avg       0.97      0.98      0.97      1591
   macro avg       0.97      0.98      0.98      1591
weighted avg       0.97      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.885, eval_acc=0.956, eval_loss=7.26, eval_precision=0.845, eval_recall=0.934]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.98      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.77      0.90      0.83       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.82      0.92      0.87       690

   micro avg       0.82      0.93      0.87      1497
   macro avg       0.84      0.98      0.90      1497
weighted avg       0.83      0.93      0.87      1497



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.88it/s, F1=0.98, train_acc=0.996, train_loss=0.602, train_precision=0.972, train_recall=0.988] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.96      0.98      0.97       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.98      0.99      0.98       702

   micro avg       0.97      0.99      0.98      1591
   macro avg       0.98      0.99      0.98      1591
weighted avg       0.97      0.99      0.98      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.886, eval_acc=0.959, eval_loss=6.86, eval_precision=0.848, eval_recall=0.932]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.79      0.88      0.83       523
         PRO       0.56      1.00      0.72        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.81      0.93      0.87       690

   micro avg       0.82      0.93      0.87      1497
   macro avg       0.87      0.97      0.91      1497
weighted avg       0.83      0.93      0.87      1497



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.988, train_acc=0.998, train_loss=0.351, train_precision=0.985, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      0.99      0.99       148
         ORG       0.98      0.99      0.99       547
         PRO       0.97      1.00      0.99        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.99      0.99      0.99       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       0.98      0.99      0.98      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.74it/s, F1=0.915, eval_acc=0.966, eval_loss=5.68, eval_precision=0.889, eval_recall=0.944]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.93      0.88       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.87      0.94      0.91      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.986, train_acc=0.998, train_loss=0.312, train_precision=0.982, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      0.99       148
         ORG       0.98      0.99      0.98       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.98      0.99      0.99       702

   micro avg       0.98      0.99      0.99      1591
   macro avg       0.98      0.99      0.98      1591
weighted avg       0.98      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.912, eval_acc=0.965, eval_loss=6.43, eval_precision=0.888, eval_recall=0.939]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.97      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.85      0.91      0.88       523
         PRO       0.72      1.00      0.84        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.91      0.97      0.94      1497
weighted avg       0.88      0.94      0.90      1497



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.995, train_acc=0.999, train_loss=0.16, train_precision=0.994, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.88      0.88        16
       TITLE       1.00      1.00      1.00       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       0.98      0.98      0.98      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.913, eval_acc=0.966, eval_loss=6.57, eval_precision=0.891, eval_recall=0.938]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.84      0.91      0.87       523
         PRO       0.82      1.00      0.90        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.988, train_acc=0.998, train_loss=0.31, train_precision=0.985, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.96      0.98      0.97        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       0.95      0.97      0.96        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.98      0.99      0.99       702

   micro avg       0.98      0.99      0.99      1591
   macro avg       0.97      0.98      0.98      1591
weighted avg       0.98      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.901, eval_acc=0.965, eval_loss=5.98, eval_precision=0.871, eval_recall=0.935]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.96      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.83      0.90      0.86       523
         PRO       0.62      1.00      0.77        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.93      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:18<00:00,  3.35it/s, F1=0.989, train_acc=0.998, train_loss=0.274, train_precision=0.986, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.98      0.99      0.98        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      0.99      0.99       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.99      0.99      0.99       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       0.98      0.98      0.98      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.899, eval_acc=0.965, eval_loss=6.08, eval_precision=0.869, eval_recall=0.933]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.82      0.90      0.86       523
         PRO       0.75      1.00      0.86        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.85      0.92      0.88       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.79it/s, F1=0.992, train_acc=0.998, train_loss=0.388, train_precision=0.988, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.99      0.99      0.99        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.99      1.00      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.98      1.00      0.99       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       0.99      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.74it/s, F1=0.91, eval_acc=0.965, eval_loss=6.15, eval_precision=0.885, eval_recall=0.936] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.94      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.84      0.91      0.87       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.89it/s, F1=0.994, train_acc=0.999, train_loss=0.23, train_precision=0.993, train_recall=0.995]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.98      0.99      0.99       547
         PRO       0.95      0.95      0.95        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       0.99      0.99      0.99      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.819, eval_acc=0.938, eval_loss=11.5, eval_precision=0.77, eval_recall=0.876] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.69      0.76      0.73       523
         PRO       0.42      0.94      0.59        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.77      0.90      0.83       690

   micro avg       0.76      0.87      0.81      1497
   macro avg       0.83      0.94      0.87      1497
weighted avg       0.77      0.87      0.82      1497



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.88it/s, F1=0.973, train_acc=0.997, train_loss=0.678, train_precision=0.963, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.98      0.99      0.98        99
         LOC       0.88      1.00      0.93         7
        NAME       1.00      1.00      1.00       148
         ORG       0.95      0.98      0.96       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.96      0.98      0.97       702

   micro avg       0.96      0.99      0.97      1591
   macro avg       0.97      0.99      0.98      1591
weighted avg       0.96      0.99      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.871, eval_acc=0.952, eval_loss=8.33, eval_precision=0.838, eval_recall=0.908]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.73      0.83      0.78       523
         PRO       0.69      1.00      0.82        18
        RACE       0.82      0.93      0.87        15
       TITLE       0.87      0.92      0.90       690

   micro avg       0.83      0.90      0.87      1497
   macro avg       0.88      0.96      0.92      1497
weighted avg       0.84      0.90      0.87      1497



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.967, train_acc=0.994, train_loss=0.92, train_precision=0.957, train_recall=0.979] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.97      0.99      0.98        99
         LOC       1.00      1.00      1.00         7
        NAME       0.95      0.96      0.95       148
         ORG       0.93      0.97      0.95       547
         PRO       0.92      0.95      0.93        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.99      0.99      0.99       702

   micro avg       0.96      0.98      0.97      1591
   macro avg       0.95      0.97      0.96      1591
weighted avg       0.96      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.61it/s, F1=0.905, eval_acc=0.962, eval_loss=6.95, eval_precision=0.881, eval_recall=0.932]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       0.40      1.00      0.57         2
        NAME       0.94      1.00      0.97       110
         ORG       0.84      0.90      0.87       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.92      0.90       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.82      0.97      0.87      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.83it/s, F1=0.99, train_acc=0.998, train_loss=0.362, train_precision=0.988, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      0.99      0.99        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      0.99      0.99       148
         ORG       0.98      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      0.99      0.99       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       1.00      0.99      1.00      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.908, eval_acc=0.963, eval_loss=6.5, eval_precision=0.882, eval_recall=0.937] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.90      0.88       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.88      0.93      0.90      1497



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.29it/s, F1=0.993, train_acc=0.999, train_loss=0.164, train_precision=0.991, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.98      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      0.99       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.922, eval_acc=0.966, eval_loss=7.03, eval_precision=0.9, eval_recall=0.946]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.96      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.89      0.94      0.92      1497



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.89it/s, F1=0.994, train_acc=0.999, train_loss=0.225, train_precision=0.993, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      0.97      0.99        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.912, eval_acc=0.962, eval_loss=7.53, eval_precision=0.882, eval_recall=0.946]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.53      1.00      0.69        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.94      0.90       690

   micro avg       0.87      0.94      0.91      1497
   macro avg       0.88      0.97      0.92      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.995, train_acc=0.999, train_loss=0.371, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.99      1.00      0.99        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      1.00      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      0.99       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.856, eval_acc=0.952, eval_loss=8.8, eval_precision=0.809, eval_recall=0.911] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.74      0.83      0.78       523
         PRO       0.56      1.00      0.72        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.80      0.93      0.86       690

   micro avg       0.80      0.91      0.85      1497
   macro avg       0.86      0.96      0.90      1497
weighted avg       0.81      0.91      0.85      1497



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.996, train_acc=0.999, train_loss=0.254, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.92, eval_acc=0.966, eval_loss=7.11, eval_precision=0.892, eval_recall=0.952] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.93      0.89       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.88      0.95      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.992, train_acc=0.999, train_loss=0.126, train_precision=0.989, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.98      0.99      0.99       547
         PRO       0.95      0.95      0.95        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      0.99      0.99       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       0.99      0.99      0.99      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.55it/s, F1=0.865, eval_acc=0.95, eval_loss=7.84, eval_precision=0.817, eval_recall=0.921] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.75      0.84      0.79       523
         PRO       0.19      1.00      0.32        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.85      0.94      0.89       690

   micro avg       0.80      0.91      0.85      1497
   macro avg       0.83      0.96      0.86      1497
weighted avg       0.83      0.91      0.87      1497



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=0.993, train_acc=0.999, train_loss=0.215, train_precision=0.991, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.98      0.99      0.99       547
         PRO       0.95      1.00      0.97        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      0.99      0.99       702

   micro avg       0.99      0.99      0.99      1591
   macro avg       0.99      1.00      0.99      1591
weighted avg       0.99      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.902, eval_acc=0.965, eval_loss=6.88, eval_precision=0.867, eval_recall=0.941]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.91      0.86       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.86      0.94      0.90       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.999, train_acc=1, train_loss=0.0365, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       0.95      0.97      0.96        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       0.99      1.00      0.99      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.906, eval_acc=0.964, eval_loss=7.08, eval_precision=0.875, eval_recall=0.941]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.83      0.91      0.87       523
         PRO       0.64      1.00      0.78        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.94      0.90       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.83it/s, F1=1, train_acc=1, train_loss=0.0389, train_precision=1, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.36it/s, F1=0.911, eval_acc=0.965, eval_loss=7.17, eval_precision=0.881, eval_recall=0.944]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.92      0.88       523
         PRO       0.62      1.00      0.77        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.79it/s, F1=0.993, train_acc=0.999, train_loss=0.16, train_precision=0.99, train_recall=0.997]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.98      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      0.99       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.891, eval_acc=0.955, eval_loss=9.64, eval_precision=0.859, eval_recall=0.928]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.81      0.89      0.85       523
         PRO       0.56      1.00      0.72        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.83      0.93      0.87       690

   micro avg       0.84      0.93      0.88      1497
   macro avg       0.88      0.97      0.91      1497
weighted avg       0.84      0.93      0.88      1497



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=0.988, train_acc=0.998, train_loss=0.541, train_precision=0.983, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.99      1.00      0.99        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.97      0.99      0.98       547
         PRO       0.97      0.97      0.97        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.98      0.99      0.99       702

   micro avg       0.98      0.99      0.99      1591
   macro avg       0.99      0.99      0.99      1591
weighted avg       0.98      0.99      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.905, eval_acc=0.96, eval_loss=7.74, eval_precision=0.88, eval_recall=0.934]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      0.99      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.90      0.87       523
         PRO       0.47      1.00      0.64        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.87      0.97      0.91      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.76it/s, F1=0.994, train_acc=0.999, train_loss=0.262, train_precision=0.992, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.97      0.99      0.98        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      1.00      0.99       547
         PRO       0.97      1.00      0.99        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      0.99       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       0.99      1.00      0.99      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.923, eval_acc=0.964, eval_loss=7.85, eval_precision=0.898, eval_recall=0.951]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.90       523
         PRO       0.58      1.00      0.73        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.89      0.97      0.93      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.999, train_acc=1, train_loss=0.0662, train_precision=0.998, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.99      1.00      0.99        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.921, eval_acc=0.965, eval_loss=7.59, eval_precision=0.897, eval_recall=0.947]


eval_reports:


calculate data/few_shot/resume/train_500.json etag: 100%|██████████| 226k/226k [00:00<00:00, 213MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 202MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 220MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 1.11MB/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.96      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.92      0.89       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.89      0.94      0.92      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_500.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot


count line size data/few_shot/resume/labels.txt: 29L [00:00, 248741.96L/s]
build line mapper: 29L [00:00, 243269.63L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8409.49it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 257544.98it/s]
load dataset from data/few_shot/resume/train_500.json: 91it [00:00, 908.22it/s]

load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/1acbeeb28deec326649877a3b4cfe533_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_500.json: 500it [00:00, 822.94it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 824.92it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_500_pretraind_task/Bert_480/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.91it/s, F1=0.0252, train_acc=0.363, train_loss=89.9, train_precision=0.0204, train_recall=0.0363]     


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        35
         EDU       0.00      0.00      0.00        99
         LOC       0.00      0.00      0.00         7
        NAME       0.08      0.01      0.02       148
         ORG       0.01      0.06      0.02       547
         PRO       0.00      0.00      0.00        37
        RACE       0.00      0.06      0.00        16
       TITLE       0.02      0.02      0.02       702

   micro avg       0.01      0.03      0.01      1591
   macro avg       0.01      0.02      0.01      1591
weighted avg       0.02      0.03      0.02      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.236, eval_acc=0.725, eval_loss=34.3, eval_precision=0.203, eval_recall=0.283]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.00      0.00      0.00       106
         LOC       0.00      0.00      0.00         2
        NAME       0.00      0.00      0.00       110
         ORG       0.15      0.29      0.20       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.23      0.39      0.29       690

   micro avg       0.20      0.28      0.23      1497
   macro avg       0.05      0.09      0.06      1497
weighted avg       0.16      0.28      0.20      1497



Epoch: 2/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=0.457, train_acc=0.852, train_loss=19.1, train_precision=0.393, train_recall=0.553]


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        35
         EDU       0.06      0.11      0.08        99
         LOC       0.00      0.00      0.00         7
        NAME       0.06      0.10      0.07       148
         ORG       0.37      0.65      0.47       547
         PRO       0.00      0.00      0.00        37
        RACE       0.00      0.00      0.00        16
       TITLE       0.55      0.73      0.63       702

   micro avg       0.38      0.56      0.45      1591
   macro avg       0.13      0.20      0.16      1591
weighted avg       0.38      0.56      0.45      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.636, eval_acc=0.906, eval_loss=11.5, eval_precision=0.559, eval_recall=0.74] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.03      0.03      0.03        33
         EDU       0.13      0.26      0.18       106
         LOC       0.00      0.00      0.00         2
        NAME       0.17      0.32      0.22       110
         ORG       0.60      0.91      0.72       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.71      0.79      0.75       690

   micro avg       0.53      0.73      0.62      1497
   macro avg       0.21      0.29      0.24      1497
weighted avg       0.56      0.73      0.63      1497



Epoch: 3/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.83it/s, F1=0.786, train_acc=0.951, train_loss=6.51, train_precision=0.74, train_recall=0.846] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.43      0.66      0.52        35
         EDU       0.54      0.71      0.61        99
         LOC       0.00      0.00      0.00         7
        NAME       0.74      0.89      0.81       148
         ORG       0.74      0.88      0.80       547
         PRO       0.06      0.11      0.07        37
        RACE       0.00      0.00      0.00        16
       TITLE       0.83      0.91      0.87       702

   micro avg       0.72      0.85      0.78      1591
   macro avg       0.42      0.52      0.46      1591
weighted avg       0.73      0.85      0.79      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.867, eval_acc=0.95, eval_loss=7.05, eval_precision=0.816, eval_recall=0.927] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.65      0.97      0.78        33
         EDU       0.87      0.93      0.90       106
         LOC       0.00      0.00      0.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.74      0.92      0.82       523
         PRO       0.48      0.72      0.58        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.84      0.93      0.89       690

   micro avg       0.80      0.92      0.85      1497
   macro avg       0.57      0.68      0.62      1497
weighted avg       0.80      0.92      0.85      1497



Epoch: 4/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=0.914, train_acc=0.981, train_loss=2.74, train_precision=0.891, train_recall=0.942]


train_reports:
              precision    recall  f1-score   support

        CONT       0.72      0.97      0.83        35
         EDU       0.90      0.95      0.92        99
         LOC       0.00      0.00      0.00         7
        NAME       0.92      0.96      0.94       148
         ORG       0.87      0.94      0.90       547
         PRO       0.57      0.68      0.62        37
        RACE       0.60      0.56      0.58        16
       TITLE       0.93      0.97      0.95       702

   micro avg       0.88      0.94      0.91      1591
   macro avg       0.69      0.75      0.72      1591
weighted avg       0.88      0.94      0.91      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.52it/s, F1=0.892, eval_acc=0.958, eval_loss=5.9, eval_precision=0.853, eval_recall=0.937] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.97      0.94       106
         LOC       0.00      0.00      0.00         2
        NAME       0.95      0.99      0.97       110
         ORG       0.80      0.91      0.85       523
         PRO       0.56      1.00      0.72        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.86      0.93      0.89       690

   micro avg       0.84      0.93      0.89      1497
   macro avg       0.75      0.85      0.79      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 5/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=0.964, train_acc=0.992, train_loss=1.25, train_precision=0.953, train_recall=0.975]


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        35
         EDU       0.97      0.98      0.97        99
         LOC       0.56      0.71      0.63         7
        NAME       0.99      0.99      0.99       148
         ORG       0.94      0.97      0.95       547
         PRO       0.90      0.95      0.92        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.96      0.98      0.97       702

   micro avg       0.95      0.97      0.96      1591
   macro avg       0.90      0.93      0.91      1591
weighted avg       0.95      0.97      0.96      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.886, eval_acc=0.965, eval_loss=4.76, eval_precision=0.849, eval_recall=0.928]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.94      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.75      0.88      0.81       523
         PRO       0.82      1.00      0.90        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.85      0.94      0.89       690

   micro avg       0.83      0.92      0.88      1497
   macro avg       0.90      0.96      0.93      1497
weighted avg       0.84      0.92      0.88      1497



Epoch: 6/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.974, train_acc=0.994, train_loss=1.1, train_precision=0.965, train_recall=0.984]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.98      0.99      0.98        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      0.99       148
         ORG       0.95      0.97      0.96       547
         PRO       0.92      0.97      0.95        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.97      0.99      0.98       702

   micro avg       0.96      0.98      0.97      1591
   macro avg       0.96      0.97      0.97      1591
weighted avg       0.96      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.53it/s, F1=0.893, eval_acc=0.946, eval_loss=9.52, eval_precision=0.857, eval_recall=0.933]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.94      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.83      0.89      0.86       523
         PRO       0.69      1.00      0.82        18
        RACE       0.83      1.00      0.91        15
       TITLE       0.84      0.93      0.88       690

   micro avg       0.85      0.93      0.89      1497
   macro avg       0.89      0.97      0.92      1497
weighted avg       0.85      0.93      0.89      1497



Epoch: 7/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.967, train_acc=0.994, train_loss=0.91, train_precision=0.958, train_recall=0.977] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        35
         EDU       0.95      0.98      0.97        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       0.96      0.98      0.97       547
         PRO       0.88      0.97      0.92        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.95      0.97      0.96       702

   micro avg       0.96      0.98      0.97      1591
   macro avg       0.95      0.97      0.96      1591
weighted avg       0.96      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.904, eval_acc=0.963, eval_loss=5.54, eval_precision=0.879, eval_recall=0.932]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.95      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.95      0.99      0.97       110
         ORG       0.81      0.90      0.85       523
         PRO       0.90      1.00      0.95        18
        RACE       0.88      0.93      0.90        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.92      0.96      0.94      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 8/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.977, train_acc=0.995, train_loss=0.64, train_precision=0.971, train_recall=0.983] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       0.98      0.99      0.98        99
         LOC       0.88      1.00      0.93         7
        NAME       0.98      0.99      0.99       148
         ORG       0.96      0.98      0.97       547
         PRO       0.95      0.97      0.96        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.97      0.98      0.98       702

   micro avg       0.97      0.98      0.97      1591
   macro avg       0.95      0.97      0.96      1591
weighted avg       0.97      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.887, eval_acc=0.955, eval_loss=7.66, eval_precision=0.853, eval_recall=0.926]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.97      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.79      0.88      0.83       523
         PRO       0.58      1.00      0.73        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.84      0.92      0.88       690

   micro avg       0.84      0.92      0.88      1497
   macro avg       0.87      0.97      0.91      1497
weighted avg       0.84      0.92      0.88      1497



Epoch: 9/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.90it/s, F1=0.971, train_acc=0.995, train_loss=0.711, train_precision=0.965, train_recall=0.979]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       0.88      1.00      0.93         7
        NAME       0.99      0.99      0.99       148
         ORG       0.95      0.97      0.96       547
         PRO       0.97      0.97      0.97        37
        RACE       0.93      0.88      0.90        16
       TITLE       0.96      0.98      0.97       702

   micro avg       0.96      0.98      0.97      1591
   macro avg       0.96      0.97      0.97      1591
weighted avg       0.96      0.98      0.97      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.902, eval_acc=0.962, eval_loss=6.16, eval_precision=0.876, eval_recall=0.93] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.83      0.90      0.86       523
         PRO       0.62      1.00      0.77        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.88      0.97      0.92      1497
weighted avg       0.87      0.93      0.89      1497



Epoch: 10/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=0.982, train_acc=0.997, train_loss=0.423, train_precision=0.979, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      0.99      0.99       148
         ORG       0.97      0.98      0.98       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.88      0.88        16
       TITLE       0.98      0.98      0.98       702

   micro avg       0.98      0.98      0.98      1591
   macro avg       0.98      0.98      0.98      1591
weighted avg       0.98      0.98      0.98      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.91, eval_acc=0.962, eval_loss=6.75, eval_precision=0.877, eval_recall=0.946] 


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.83      0.91      0.87       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.94      0.90       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 11/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=0.991, train_acc=0.999, train_loss=0.155, train_precision=0.989, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.94      0.91        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       0.98      0.99      0.99      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.915, eval_acc=0.964, eval_loss=6.56, eval_precision=0.888, eval_recall=0.943]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.93      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.92      0.88       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.87      0.94      0.91      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 12/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.25it/s, F1=0.997, train_acc=1, train_loss=0.105, train_precision=0.997, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      0.99      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       0.88      0.94      0.91        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       0.98      0.99      0.99      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.915, eval_acc=0.963, eval_loss=6.88, eval_precision=0.887, eval_recall=0.945]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.84      0.92      0.88       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.92      0.98      0.95      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 13/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=0.993, train_acc=0.999, train_loss=0.136, train_precision=0.991, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      0.99      0.99       148
         ORG       0.99      0.99      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       0.99      1.00      1.00       702

   micro avg       0.99      1.00      0.99      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       0.99      1.00      0.99      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.912, eval_acc=0.963, eval_loss=6.72, eval_precision=0.888, eval_recall=0.939]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.92      0.88       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.92      0.90       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.88      0.94      0.90      1497



Epoch: 14/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.85it/s, F1=0.996, train_acc=0.999, train_loss=0.0797, train_precision=0.996, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       1.00      0.99      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.918, eval_acc=0.963, eval_loss=7.08, eval_precision=0.892, eval_recall=0.947]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.93      0.89       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 15/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.83it/s, F1=0.998, train_acc=1, train_loss=0.0572, train_precision=0.998, train_recall=0.999]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.921, eval_acc=0.963, eval_loss=7.13, eval_precision=0.897, eval_recall=0.946]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.91       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 16/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.77it/s, F1=0.998, train_acc=1, train_loss=0.0403, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.921, eval_acc=0.964, eval_loss=7.31, eval_precision=0.897, eval_recall=0.947]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.92      0.89       523
         PRO       0.64      1.00      0.78        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.88      0.93      0.91       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 17/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=0.998, train_acc=1, train_loss=0.0315, train_precision=0.998, train_recall=0.999]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.919, eval_acc=0.963, eval_loss=7.52, eval_precision=0.895, eval_recall=0.947]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.67      1.00      0.80        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 18/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.26it/s, F1=0.999, train_acc=0.999, train_loss=0.175, train_precision=0.999, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.918, eval_acc=0.963, eval_loss=7.37, eval_precision=0.895, eval_recall=0.944]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 19/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=1, train_acc=1, train_loss=0.0384, train_precision=0.999, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.916, eval_acc=0.964, eval_loss=7.17, eval_precision=0.887, eval_recall=0.948]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.88      0.95      0.91      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.89      0.95      0.91      1497



Epoch: 20/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.84it/s, F1=0.999, train_acc=1, train_loss=0.0307, train_precision=0.998, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       0.99      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.916, eval_acc=0.964, eval_loss=7.28, eval_precision=0.889, eval_recall=0.946]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      0.99      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.62      1.00      0.77        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.91       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 21/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.83it/s, F1=0.999, train_acc=1, train_loss=0.0333, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.918, eval_acc=0.964, eval_loss=7.59, eval_precision=0.893, eval_recall=0.946]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.67      1.00      0.80        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 22/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=1, train_acc=1, train_loss=0.0163, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.916, eval_acc=0.963, eval_loss=7.83, eval_precision=0.889, eval_recall=0.946]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 23/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=1, train_acc=1, train_loss=0.0284, train_precision=1, train_recall=1]        


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.918, eval_acc=0.964, eval_loss=7.55, eval_precision=0.893, eval_recall=0.944]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.64      1.00      0.78        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.90       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 24/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.81it/s, F1=1, train_acc=1, train_loss=0.0142, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.921, eval_acc=0.964, eval_loss=7.89, eval_precision=0.897, eval_recall=0.948]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 25/30 Train: 100%|██████████| 63/63 [00:19<00:00,  3.20it/s, F1=0.999, train_acc=1, train_loss=0.0209, train_precision=0.999, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.46it/s, F1=0.922, eval_acc=0.964, eval_loss=7.82, eval_precision=0.899, eval_recall=0.947]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.69      1.00      0.82        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.91       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.89      0.94      0.92      1497



Epoch: 26/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.82it/s, F1=1, train_acc=1, train_loss=0.0104, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.923, eval_acc=0.964, eval_loss=7.92, eval_precision=0.9, eval_recall=0.947]  


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.87      0.92      0.90       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.93      0.91       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.89      0.94      0.92      1497



Epoch: 27/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.83it/s, F1=1, train_acc=1, train_loss=0.0132, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.923, eval_acc=0.964, eval_loss=8.31, eval_precision=0.898, eval_recall=0.949]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.72      1.00      0.84        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 28/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.86it/s, F1=0.999, train_acc=1, train_loss=0.0314, train_precision=0.999, train_recall=0.999]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.919, eval_acc=0.964, eval_loss=7.71, eval_precision=0.892, eval_recall=0.948]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.62      1.00      0.77        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 29/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.80it/s, F1=0.998, train_acc=1, train_loss=0.0278, train_precision=0.997, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       0.99      1.00      0.99       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.922, eval_acc=0.964, eval_loss=8.01, eval_precision=0.898, eval_recall=0.948]


eval_reports:


  0%|          | 0/63 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.58      1.00      0.73        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 30/30 Train: 100%|██████████| 63/63 [00:16<00:00,  3.79it/s, F1=1, train_acc=1, train_loss=0.0115, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        35
         EDU       1.00      1.00      1.00        99
         LOC       1.00      1.00      1.00         7
        NAME       1.00      1.00      1.00       148
         ORG       1.00      1.00      1.00       547
         PRO       1.00      1.00      1.00        37
        RACE       1.00      1.00      1.00        16
       TITLE       1.00      1.00      1.00       702

   micro avg       1.00      1.00      1.00      1591
   macro avg       1.00      1.00      1.00      1591
weighted avg       1.00      1.00      1.00      1591



Eval Result: 100%|██████████| 8/8 [00:05<00:00,  1.58it/s, F1=0.917, eval_acc=0.963, eval_loss=7.96, eval_precision=0.891, eval_recall=0.946]


eval_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.87      0.92      0.89       523
         PRO       0.60      1.00      0.75        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.89      0.94      0.91      1497



calculate data/few_shot/resume/train_1000.json etag: 100%|██████████| 466k/466k [00:00<00:00, 266MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 197MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 208MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 325kB/s]

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_1000.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_shot/resume/test.json",
    "tag_file": "data/few_shot/resume/labels.txt",
    "bert_vocab_file": "./model/chinese_wwm_ext/vocab.txt",
    "output_eval": true,
    "max_scan_num": 1000000,
    "add_seq_vocab": false,
    "max_seq_length": 150,
    "max_word_num": 5,
    "default_tag": "O",
    "use_test": false,
    "do_shuffle": true,
    "do_predict": false,
    "task_name": "resume_pretrain_lebert_crf_1000_x1"
}
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/lexicon_tree



count line size data/few_shot/resume/labels.txt: 29L [00:00, 187708.05L/s]
build line mapper: 29L [00:00, 230368.97L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 7850.95it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 235351.73it/s]
load dataset from data/few_shot/resume/train_1000.json: 0it [00:00, ?it/s]

load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_1000.json: 1000it [00:01, 802.00it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 819.80it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mo

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.228, train_acc=0.582, train_loss=52.8, train_precision=0.197, train_recall=0.278]      


train_reports:
              precision    recall  f1-score   support

        CONT       0.08      0.10      0.09        70
         EDU       0.28      0.13      0.17       197
         LOC       0.00      0.00      0.00        16
        NAME       0.01      0.16      0.01       271
         ORG       0.22      0.36      0.27      1151
         PRO       0.00      0.00      0.00        64
        RACE       0.00      0.00      0.00        32
       TITLE       0.15      0.28      0.20      1517

   micro avg       0.08      0.27      0.12      3318
   macro avg       0.09      0.13      0.09      3318
weighted avg       0.16      0.27      0.20      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.82, eval_acc=0.936, eval_loss=7.78, eval_precision=0.778, eval_recall=0.869] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.67      0.97      0.79        33
         EDU       0.74      0.79      0.76       106
         LOC       0.00      0.00      0.00         2
        NAME       0.94      0.96      0.95       110
         ORG       0.75      0.87      0.80       523
         PRO       0.13      0.11      0.12        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.76      0.89      0.82       690

   micro avg       0.76      0.86      0.81      1497
   macro avg       0.50      0.57      0.53      1497
weighted avg       0.75      0.86      0.80      1497



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.75it/s, F1=0.832, train_acc=0.957, train_loss=6.12, train_precision=0.789, train_recall=0.887]


train_reports:
              precision    recall  f1-score   support

        CONT       0.71      0.93      0.80        70
         EDU       0.72      0.84      0.78       197
         LOC       0.11      0.12      0.11        16
        NAME       0.88      0.96      0.92       271
         ORG       0.75      0.87      0.80      1151
         PRO       0.45      0.52      0.48        64
        RACE       0.88      0.69      0.77        32
       TITLE       0.81      0.91      0.86      1517

   micro avg       0.77      0.88      0.83      3318
   macro avg       0.66      0.73      0.69      3318
weighted avg       0.77      0.88      0.83      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.896, eval_acc=0.958, eval_loss=5.38, eval_precision=0.853, eval_recall=0.945]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.97      0.94        33
         EDU       0.84      0.97      0.90       106
         LOC       0.20      1.00      0.33         2
        NAME       0.96      1.00      0.98       110
         ORG       0.82      0.93      0.88       523
         PRO       0.39      0.67      0.49        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.85      0.94      0.89       690

   micro avg       0.84      0.94      0.89      1497
   macro avg       0.74      0.93      0.79      1497
weighted avg       0.85      0.94      0.89      1497



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.79it/s, F1=0.925, train_acc=0.982, train_loss=2.55, train_precision=0.904, train_recall=0.951]


train_reports:
              precision    recall  f1-score   support

        CONT       0.91      0.97      0.94        70
         EDU       0.96      0.98      0.97       197
         LOC       0.57      0.81      0.67        16
        NAME       0.92      0.96      0.94       271
         ORG       0.87      0.94      0.91      1151
         PRO       0.77      0.83      0.80        64
        RACE       0.75      0.84      0.79        32
       TITLE       0.91      0.96      0.93      1517

   micro avg       0.89      0.95      0.92      3318
   macro avg       0.83      0.91      0.87      3318
weighted avg       0.89      0.95      0.92      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.914, eval_acc=0.969, eval_loss=3.88, eval_precision=0.885, eval_recall=0.947]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.93      0.89       523
         PRO       0.74      0.94      0.83        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.88      0.95      0.91      1497
   macro avg       0.91      0.96      0.94      1497
weighted avg       0.88      0.95      0.91      1497



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.946, train_acc=0.988, train_loss=1.75, train_precision=0.93, train_recall=0.964] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.95      0.99      0.97        70
         EDU       0.97      0.98      0.97       197
         LOC       0.78      0.88      0.82        16
        NAME       1.00      0.99      0.99       271
         ORG       0.91      0.96      0.94      1151
         PRO       0.91      0.94      0.92        64
        RACE       0.82      0.84      0.83        32
       TITLE       0.92      0.96      0.94      1517

   micro avg       0.92      0.96      0.94      3318
   macro avg       0.91      0.94      0.92      3318
weighted avg       0.92      0.96      0.94      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.918, eval_acc=0.972, eval_loss=3.6, eval_precision=0.888, eval_recall=0.949] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.94      0.98      0.96       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.85      0.93      0.89       523
         PRO       0.82      1.00      0.90        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.86      0.97      0.90      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.961, train_acc=0.992, train_loss=1.14, train_precision=0.95, train_recall=0.973] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        70
         EDU       0.96      0.97      0.96       197
         LOC       0.78      0.88      0.82        16
        NAME       0.98      0.99      0.99       271
         ORG       0.94      0.97      0.96      1151
         PRO       0.91      0.98      0.95        64
        RACE       0.94      0.94      0.94        32
       TITLE       0.95      0.97      0.96      1517

   micro avg       0.95      0.97      0.96      3318
   macro avg       0.93      0.96      0.94      3318
weighted avg       0.95      0.97      0.96      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.912, eval_acc=0.965, eval_loss=5.33, eval_precision=0.88, eval_recall=0.947] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.92      0.88       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.85      0.94      0.89       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.92      0.98      0.95      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.968, train_acc=0.993, train_loss=1, train_precision=0.959, train_recall=0.979]   


train_reports:
              precision    recall  f1-score   support

        CONT       0.95      0.99      0.97        70
         EDU       0.99      0.99      0.99       197
         LOC       0.82      0.88      0.85        16
        NAME       0.98      1.00      0.99       271
         ORG       0.96      0.97      0.97      1151
         PRO       0.97      0.98      0.98        64
        RACE       0.94      0.94      0.94        32
       TITLE       0.96      0.98      0.97      1517

   micro avg       0.96      0.98      0.97      3318
   macro avg       0.95      0.97      0.96      3318
weighted avg       0.96      0.98      0.97      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.924, eval_acc=0.973, eval_loss=3.82, eval_precision=0.895, eval_recall=0.955]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.94      0.90       523
         PRO       0.65      0.94      0.77        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.86      0.97      0.91      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.978, train_acc=0.995, train_loss=0.644, train_precision=0.972, train_recall=0.985]


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        70
         EDU       0.98      0.99      0.99       197
         LOC       0.88      0.94      0.91        16
        NAME       0.99      1.00      1.00       271
         ORG       0.96      0.98      0.97      1151
         PRO       0.93      0.97      0.95        64
        RACE       1.00      0.94      0.97        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.97      0.99      0.98      3318
   macro avg       0.96      0.98      0.97      3318
weighted avg       0.97      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.55it/s, F1=0.931, eval_acc=0.971, eval_loss=4.09, eval_precision=0.907, eval_recall=0.957]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.94      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.93      1497
   macro avg       0.88      0.98      0.93      1497
weighted avg       0.90      0.95      0.93      1497



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.79it/s, F1=0.986, train_acc=0.997, train_loss=0.392, train_precision=0.983, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.98      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.98      1151
         PRO       0.93      0.97      0.95        64
        RACE       0.97      1.00      0.98        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.98      0.99      0.99      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.925, eval_acc=0.97, eval_loss=4.03, eval_precision=0.905, eval_recall=0.947] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.99      0.98      0.99       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.87      0.97      0.91      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.991, train_acc=0.998, train_loss=0.279, train_precision=0.989, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      0.99      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.95      0.98      0.97        64
        RACE       1.00      0.97      0.98        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.924, eval_acc=0.973, eval_loss=4, eval_precision=0.898, eval_recall=0.952]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.98      0.99      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.93      0.90       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.994, train_acc=0.999, train_loss=0.216, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.98      0.98      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.924, eval_acc=0.97, eval_loss=5.69, eval_precision=0.901, eval_recall=0.948] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.94      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.89      0.93      0.91       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.993, train_acc=0.998, train_loss=0.287, train_precision=0.992, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      0.99      0.99       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.931, eval_acc=0.973, eval_loss=4.41, eval_precision=0.904, eval_recall=0.959]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.94      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.88      0.95      0.92       690

   micro avg       0.90      0.96      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.90      0.96      0.93      1497



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.99, train_acc=0.998, train_loss=0.273, train_precision=0.988, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.99      1151
         PRO       0.97      0.98      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.928, eval_acc=0.971, eval_loss=4.91, eval_precision=0.903, eval_recall=0.954]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.94      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.993, train_acc=0.999, train_loss=0.158, train_precision=0.991, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.929, eval_acc=0.97, eval_loss=4.77, eval_precision=0.91, eval_recall=0.95]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.92      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.988, train_acc=0.998, train_loss=0.237, train_precision=0.984, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.99      1.00      1.00      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.929, eval_acc=0.971, eval_loss=4.85, eval_precision=0.908, eval_recall=0.951]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.98      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.93      0.91       523
         PRO       0.75      1.00      0.86        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.90      0.95      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.75it/s, F1=0.996, train_acc=0.999, train_loss=0.151, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      1.00      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.927, eval_acc=0.971, eval_loss=4.15, eval_precision=0.908, eval_recall=0.948]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.98      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.92      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.93       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.95      0.92      1497



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.992, train_acc=0.999, train_loss=0.229, train_precision=0.99, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.934, eval_acc=0.972, eval_loss=4.86, eval_precision=0.915, eval_recall=0.955]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.99      0.98      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.94      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.95      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.82it/s, F1=0.999, train_acc=1, train_loss=0.051, train_precision=0.998, train_recall=0.999] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.18it/s, F1=0.934, eval_acc=0.971, eval_loss=4.94, eval_precision=0.919, eval_recall=0.95] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.983, train_acc=0.996, train_loss=0.706, train_precision=0.979, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       0.98      0.99      0.98      1151
         PRO       0.89      0.97      0.93        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.97      0.99      0.98      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.98      0.99      0.98      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.46it/s, F1=0.916, eval_acc=0.965, eval_loss=5.9, eval_precision=0.895, eval_recall=0.938] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.96      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.13      0.17      0.15        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.88      0.93      0.91      1497
   macro avg       0.85      0.87      0.86      1497
weighted avg       0.89      0.93      0.91      1497



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.41it/s, F1=0.983, train_acc=0.996, train_loss=0.738, train_precision=0.978, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.94      0.97      0.95       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       0.98      0.99      0.99      1151
         PRO       0.81      0.86      0.83        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.96      0.98      0.97      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.926, eval_acc=0.972, eval_loss=4.75, eval_precision=0.9, eval_recall=0.953]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.93      0.98      0.95       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.93      0.90       523
         PRO       0.69      1.00      0.82        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.89      0.95      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.87      0.98      0.92      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.985, train_acc=0.997, train_loss=0.531, train_precision=0.98, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.96      0.99      0.97        70
         EDU       0.97      0.99      0.98       197
         LOC       1.00      1.00      1.00        16
        NAME       0.97      1.00      0.99       271
         ORG       0.97      0.99      0.98      1151
         PRO       0.97      1.00      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.98      0.99      0.99      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.923, eval_acc=0.966, eval_loss=6.06, eval_precision=0.905, eval_recall=0.943]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.92      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.89      0.94      0.91       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.93      0.98      0.96      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.82it/s, F1=0.991, train_acc=0.998, train_loss=0.382, train_precision=0.988, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        70
         EDU       0.98      1.00      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       0.98      1.00      0.99       271
         ORG       0.98      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.935, eval_acc=0.969, eval_loss=5.19, eval_precision=0.923, eval_recall=0.946]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.99      0.98      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.82it/s, F1=0.993, train_acc=0.999, train_loss=0.23, train_precision=0.992, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.96      0.97      0.96        70
         EDU       0.98      0.98      0.98       197
         LOC       0.68      0.81      0.74        16
        NAME       0.99      1.00      0.99       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.95      0.97      0.96      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.939, eval_acc=0.971, eval_loss=5.39, eval_precision=0.92, eval_recall=0.958] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      0.97      0.98        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.94      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.95      0.93       690

   micro avg       0.92      0.96      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.92      0.96      0.94      1497



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.995, train_acc=0.999, train_loss=0.202, train_precision=0.993, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.98      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.95      0.98      0.97        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.938, eval_acc=0.973, eval_loss=5.29, eval_precision=0.919, eval_recall=0.958]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.94      0.92       523
         PRO       0.71      0.94      0.81        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.95      0.94       690

   micro avg       0.92      0.96      0.94      1497
   macro avg       0.89      0.98      0.92      1497
weighted avg       0.92      0.96      0.94      1497



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.82it/s, F1=0.994, train_acc=0.999, train_loss=0.218, train_precision=0.992, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.93      0.97      0.95        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      1.00      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.927, eval_acc=0.97, eval_loss=5.32, eval_precision=0.91, eval_recall=0.945]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.93      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.93      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.989, train_acc=0.998, train_loss=0.37, train_precision=0.985, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.98      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.99      1.00      1.00      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.932, eval_acc=0.967, eval_loss=5.32, eval_precision=0.916, eval_recall=0.949]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      0.96      0.98       110
         ORG       0.88      0.94      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=0.995, train_acc=0.998, train_loss=0.349, train_precision=0.995, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      0.99      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.937, eval_acc=0.972, eval_loss=4.56, eval_precision=0.92, eval_recall=0.955] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       1.00      0.98      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.94      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.95      0.93       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.74it/s, F1=0.997, train_acc=1, train_loss=0.0682, train_precision=0.997, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.943, eval_acc=0.972, eval_loss=4.54, eval_precision=0.931, eval_recall=0.956]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      1.00      0.99       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.94      0.93       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.87      0.98      0.91      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.79it/s, F1=0.999, train_acc=1, train_loss=0.0289, train_precision=0.999, train_recall=1]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.939, eval_acc=0.973, eval_loss=4.83, eval_precision=0.926, eval_recall=0.953]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.999, train_acc=1, train_loss=0.0413, train_precision=0.999, train_recall=1]       


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.938, eval_acc=0.971, eval_loss=4.52, eval_precision=0.933, eval_recall=0.944]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.99      0.98      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.92      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.93      0.94      0.94      1497
   macro avg       0.95      0.97      0.96      1497
weighted avg       0.93      0.94      0.94      1497



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.994, train_acc=0.998, train_loss=0.32, train_precision=0.992, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.94, eval_acc=0.971, eval_loss=5.41, eval_precision=0.924, eval_recall=0.956] 


eval_reports:


calculate data/few_shot/resume/train_1000.json etag: 100%|██████████| 466k/466k [00:00<00:00, 249MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 286MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 218MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 302kB/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.99      1.00      1.00       106
         LOC       0.29      1.00      0.44         2
        NAME       0.96      1.00      0.98       110
         ORG       0.90      0.94      0.92       523
         PRO       0.90      1.00      0.95        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.95      0.93       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.86      0.98      0.90      1497
weighted avg       0.92      0.95      0.94      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_1000.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_sho


count line size data/few_shot/resume/labels.txt: 29L [00:00, 219557.43L/s]
build line mapper: 29L [00:00, 196820.09L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8327.73it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 265702.52it/s]
load dataset from data/few_shot/resume/train_1000.json: 92it [00:00, 915.91it/s]

load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_1000.json: 1000it [00:01, 802.24it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 821.67it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mo

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.72it/s, F1=0.315, train_acc=0.606, train_loss=51.4, train_precision=0.285, train_recall=0.358]      


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        70
         EDU       0.21      0.19      0.20       197
         LOC       0.00      0.00      0.00        16
        NAME       0.01      0.02      0.01       271
         ORG       0.19      0.38      0.26      1151
         PRO       0.00      0.00      0.00        64
        RACE       0.00      0.00      0.00        32
       TITLE       0.37      0.44      0.41      1517

   micro avg       0.12      0.35      0.18      3318
   macro avg       0.10      0.13      0.11      3318
weighted avg       0.25      0.35      0.29      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.57it/s, F1=0.778, eval_acc=0.942, eval_loss=7.84, eval_precision=0.719, eval_recall=0.849]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        33
         EDU       0.63      0.82      0.71       106
         LOC       0.00      0.00      0.00         2
        NAME       0.83      0.92      0.87       110
         ORG       0.71      0.87      0.78       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.84      0.92      0.88       690

   micro avg       0.72      0.85      0.78      1497
   macro avg       0.38      0.44      0.41      1497
weighted avg       0.74      0.85      0.79      1497



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.72it/s, F1=0.835, train_acc=0.959, train_loss=5.87, train_precision=0.796, train_recall=0.883]


train_reports:
              precision    recall  f1-score   support

        CONT       0.41      0.64      0.50        70
         EDU       0.80      0.93      0.86       197
         LOC       0.00      0.00      0.00        16
        NAME       0.98      0.96      0.97       271
         ORG       0.78      0.89      0.83      1151
         PRO       0.25      0.36      0.29        64
        RACE       0.15      0.22      0.18        32
       TITLE       0.86      0.93      0.89      1517

   micro avg       0.79      0.89      0.84      3318
   macro avg       0.53      0.62      0.57      3318
weighted avg       0.81      0.89      0.85      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.862, eval_acc=0.956, eval_loss=5.57, eval_precision=0.808, eval_recall=0.927]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.90      0.96      0.93       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.99      0.98       110
         ORG       0.79      0.92      0.85       523
         PRO       0.32      0.67      0.44        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.79      0.92      0.85       690

   micro avg       0.80      0.93      0.86      1497
   macro avg       0.70      0.80      0.74      1497
weighted avg       0.81      0.93      0.86      1497



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.915, train_acc=0.978, train_loss=3, train_precision=0.896, train_recall=0.936]   


train_reports:
              precision    recall  f1-score   support

        CONT       0.87      0.97      0.92        70
         EDU       0.91      0.96      0.94       197
         LOC       0.35      0.44      0.39        16
        NAME       0.98      0.98      0.98       271
         ORG       0.86      0.92      0.89      1151
         PRO       0.72      0.81      0.76        64
        RACE       0.74      0.88      0.80        32
       TITLE       0.91      0.94      0.92      1517

   micro avg       0.89      0.94      0.91      3318
   macro avg       0.79      0.86      0.83      3318
weighted avg       0.89      0.94      0.91      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.923, eval_acc=0.972, eval_loss=3.72, eval_precision=0.9, eval_recall=0.948]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.90      0.98      0.94       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.92      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.90      0.95      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.88      0.97      0.92      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.959, train_acc=0.99, train_loss=1.61, train_precision=0.947, train_recall=0.972] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.95      0.99      0.97        70
         EDU       0.98      0.98      0.98       197
         LOC       0.78      0.88      0.82        16
        NAME       0.98      0.99      0.98       271
         ORG       0.94      0.97      0.96      1151
         PRO       0.89      0.92      0.91        64
        RACE       0.78      0.88      0.82        32
       TITLE       0.95      0.97      0.96      1517

   micro avg       0.95      0.97      0.96      3318
   macro avg       0.91      0.95      0.93      3318
weighted avg       0.95      0.97      0.96      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.921, eval_acc=0.969, eval_loss=3.98, eval_precision=0.893, eval_recall=0.952]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.93      0.90       523
         PRO       0.68      0.94      0.79        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.88      0.95      0.92       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.85      0.96      0.89      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.966, train_acc=0.992, train_loss=1.1, train_precision=0.956, train_recall=0.977] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.93      0.99      0.96        70
         EDU       0.98      0.99      0.99       197
         LOC       0.78      0.88      0.82        16
        NAME       0.99      1.00      0.99       271
         ORG       0.94      0.97      0.95      1151
         PRO       0.93      0.98      0.95        64
        RACE       0.88      0.88      0.88        32
       TITLE       0.96      0.98      0.97      1517

   micro avg       0.95      0.98      0.96      3318
   macro avg       0.92      0.96      0.94      3318
weighted avg       0.95      0.98      0.96      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.909, eval_acc=0.959, eval_loss=5.92, eval_precision=0.888, eval_recall=0.933]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.98      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       1.00      1.00      1.00       110
         ORG       0.86      0.89      0.87       523
         PRO       0.65      0.94      0.77        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.86      0.94      0.90       690

   micro avg       0.88      0.93      0.90      1497
   macro avg       0.86      0.96      0.90      1497
weighted avg       0.88      0.93      0.90      1497



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.75it/s, F1=0.978, train_acc=0.995, train_loss=0.722, train_precision=0.973, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      0.99      0.98        70
         EDU       0.98      0.99      0.99       197
         LOC       0.83      0.94      0.88        16
        NAME       0.99      1.00      0.99       271
         ORG       0.97      0.98      0.97      1151
         PRO       0.88      0.94      0.91        64
        RACE       0.82      0.84      0.83        32
       TITLE       0.97      0.98      0.98      1517

   micro avg       0.97      0.98      0.97      3318
   macro avg       0.93      0.96      0.94      3318
weighted avg       0.97      0.98      0.97      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.925, eval_acc=0.972, eval_loss=4.19, eval_precision=0.902, eval_recall=0.951]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.94      0.99      0.96       106
         LOC       0.50      1.00      0.67         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.85      0.98      0.90      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.79it/s, F1=0.978, train_acc=0.995, train_loss=0.697, train_precision=0.972, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        70
         EDU       0.98      0.99      0.99       197
         LOC       0.94      0.94      0.94        16
        NAME       0.99      1.00      1.00       271
         ORG       0.96      0.98      0.97      1151
         PRO       0.94      0.97      0.95        64
        RACE       0.94      0.94      0.94        32
       TITLE       0.97      0.98      0.98      1517

   micro avg       0.97      0.98      0.98      3318
   macro avg       0.96      0.97      0.97      3318
weighted avg       0.97      0.98      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.927, eval_acc=0.972, eval_loss=4, eval_precision=0.908, eval_recall=0.948]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.97      0.94        33
         EDU       0.95      0.98      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       0.83      1.00      0.91        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.87      0.98      0.91      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.986, train_acc=0.997, train_loss=0.443, train_precision=0.983, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        70
         EDU       0.99      0.99      0.99       197
         LOC       0.94      1.00      0.97        16
        NAME       0.99      1.00      1.00       271
         ORG       0.98      0.99      0.98      1151
         PRO       0.95      0.98      0.97        64
        RACE       0.97      0.94      0.95        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.97      0.99      0.98      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.934, eval_acc=0.976, eval_loss=3.66, eval_precision=0.917, eval_recall=0.952]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.981, train_acc=0.996, train_loss=0.625, train_precision=0.976, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        70
         EDU       0.99      0.99      0.99       197
         LOC       0.94      1.00      0.97        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.98      0.98      1151
         PRO       0.94      0.98      0.96        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.97      0.98      0.97      1517

   micro avg       0.97      0.99      0.98      3318
   macro avg       0.98      0.99      0.98      3318
weighted avg       0.97      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.923, eval_acc=0.974, eval_loss=3.36, eval_precision=0.899, eval_recall=0.949]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.92      0.89       523
         PRO       0.75      1.00      0.86        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.94      0.93       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.93      0.98      0.95      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.73it/s, F1=0.993, train_acc=0.999, train_loss=0.176, train_precision=0.991, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.929, eval_acc=0.975, eval_loss=3.79, eval_precision=0.91, eval_recall=0.948] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.98      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.91      0.94      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.94      0.93      1497



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.41it/s, F1=0.996, train_acc=0.999, train_loss=0.102, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       0.99      1.00      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      1.00      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.33it/s, F1=0.943, eval_acc=0.975, eval_loss=4.09, eval_precision=0.932, eval_recall=0.955]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.93      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.95      0.95      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.974, train_acc=0.994, train_loss=0.938, train_precision=0.968, train_recall=0.982]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.94      0.97      0.95       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.95      0.98      0.96      1151
         PRO       0.94      0.97      0.95        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.97      0.98      0.97      1517

   micro avg       0.96      0.98      0.97      3318
   macro avg       0.97      0.99      0.98      3318
weighted avg       0.96      0.98      0.97      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.921, eval_acc=0.971, eval_loss=3.94, eval_precision=0.904, eval_recall=0.938]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.94      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.92      1.00      0.96       110
         ORG       0.87      0.91      0.89       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.90      0.93      0.92      1497
   macro avg       0.92      0.97      0.95      1497
weighted avg       0.90      0.93      0.92      1497



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.988, train_acc=0.998, train_loss=0.372, train_precision=0.984, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.95      0.97      0.96       197
         LOC       1.00      1.00      1.00        16
        NAME       0.98      1.00      0.99       271
         ORG       0.98      0.99      0.99      1151
         PRO       0.91      0.97      0.94        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.98      0.99      0.98      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.926, eval_acc=0.973, eval_loss=3.83, eval_precision=0.907, eval_recall=0.945]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.93      0.98      0.95       106
         LOC       0.50      1.00      0.67         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.988, train_acc=0.998, train_loss=0.32, train_precision=0.984, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.96      0.98      0.97       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       0.98      0.99      0.99      1151
         PRO       0.93      0.97      0.95        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.98      0.99      0.99      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.936, eval_acc=0.975, eval_loss=4.2, eval_precision=0.917, eval_recall=0.957] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.97      0.94        33
         EDU       0.95      0.99      0.97       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.94      0.92       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.95      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.85      0.98      0.90      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.79it/s, F1=0.994, train_acc=0.999, train_loss=0.2, train_precision=0.992, train_recall=0.996]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.92      0.95      0.94        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.938, eval_acc=0.975, eval_loss=4.34, eval_precision=0.926, eval_recall=0.951]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.98      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.74it/s, F1=0.995, train_acc=0.999, train_loss=0.147, train_precision=0.993, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      0.99      0.99       197
         LOC       0.94      1.00      0.97        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.93, eval_acc=0.971, eval_loss=5.24, eval_precision=0.918, eval_recall=0.942] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.92      0.89       523
         PRO       0.67      1.00      0.80        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.92      0.93      0.93       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.93      0.97      0.94      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.43it/s, F1=0.994, train_acc=0.999, train_loss=0.185, train_precision=0.992, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       0.82      0.88      0.85        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       0.97      0.98      0.98      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.939, eval_acc=0.972, eval_loss=4.92, eval_precision=0.922, eval_recall=0.958]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.98      0.97       106
         LOC       0.40      1.00      0.57         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.94      0.91       523
         PRO       0.75      1.00      0.86        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.96      0.94       690

   micro avg       0.92      0.96      0.94      1497
   macro avg       0.85      0.98      0.90      1497
weighted avg       0.92      0.96      0.94      1497



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.69it/s, F1=0.996, train_acc=0.999, train_loss=0.168, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.935, eval_acc=0.972, eval_loss=4.73, eval_precision=0.92, eval_recall=0.95]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.97      0.96       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.92      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.95      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.87      0.98      0.91      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.997, train_acc=1, train_loss=0.104, train_precision=0.997, train_recall=0.998]     


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.935, eval_acc=0.969, eval_loss=5.36, eval_precision=0.92, eval_recall=0.951] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.97      0.97       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.93      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.95      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.87      0.98      0.91      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.983, train_acc=0.996, train_loss=0.533, train_precision=0.98, train_recall=0.986] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.98      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      0.99       271
         ORG       0.97      0.98      0.98      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.39it/s, F1=0.916, eval_acc=0.965, eval_loss=5.18, eval_precision=0.892, eval_recall=0.942]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.94      0.97      0.95       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.92      0.89       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.86      0.98      0.91      1497
weighted avg       0.89      0.94      0.92      1497



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.45it/s, F1=0.995, train_acc=0.999, train_loss=0.15, train_precision=0.995, train_recall=0.995] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      1.00      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.938, eval_acc=0.972, eval_loss=5.02, eval_precision=0.926, eval_recall=0.95] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      0.99      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.74it/s, F1=0.997, train_acc=0.999, train_loss=0.128, train_precision=0.997, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.927, eval_acc=0.973, eval_loss=5.2, eval_precision=0.912, eval_recall=0.943] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.92      0.90       523
         PRO       0.90      1.00      0.95        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.994, train_acc=0.999, train_loss=0.236, train_precision=0.993, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        70
         EDU       0.99      0.99      0.99       197
         LOC       0.94      0.94      0.94        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      0.99      1151
         PRO       0.90      0.95      0.92        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      1.00      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.98      0.98      0.98      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.47it/s, F1=0.926, eval_acc=0.971, eval_loss=5.24, eval_precision=0.91, eval_recall=0.943] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.92      0.89       523
         PRO       0.58      0.78      0.67        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.91      0.95      0.93      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.982, train_acc=0.996, train_loss=0.886, train_precision=0.977, train_recall=0.988]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.98      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.96      0.98      0.97      1151
         PRO       0.91      0.95      0.93        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.97      0.99      0.98      3318
   macro avg       0.98      0.99      0.98      3318
weighted avg       0.97      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.926, eval_acc=0.968, eval_loss=4.74, eval_precision=0.907, eval_recall=0.946]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      0.97      0.98        33
         EDU       0.92      0.97      0.94       106
         LOC       0.50      1.00      0.67         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.93      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.86      0.98      0.90      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.985, train_acc=0.996, train_loss=0.703, train_precision=0.981, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.98      0.99      0.99       197
         LOC       0.83      0.94      0.88        16
        NAME       1.00      1.00      1.00       271
         ORG       0.97      0.99      0.98      1151
         PRO       0.98      0.98      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.97      0.99      0.98      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.918, eval_acc=0.966, eval_loss=4.83, eval_precision=0.905, eval_recall=0.933]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.96      0.97      0.97       106
         LOC       0.22      1.00      0.36         2
        NAME       0.99      1.00      1.00       110
         ORG       0.85      0.90      0.87       523
         PRO       0.60      1.00      0.75        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.93      0.93       690

   micro avg       0.90      0.93      0.91      1497
   macro avg       0.81      0.97      0.85      1497
weighted avg       0.90      0.93      0.92      1497



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.83it/s, F1=0.991, train_acc=0.998, train_loss=0.472, train_precision=0.989, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      0.99      0.99       197
         LOC       0.94      1.00      0.97        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.935, eval_acc=0.968, eval_loss=5.63, eval_precision=0.917, eval_recall=0.954]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      1.00      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.94      0.91       523
         PRO       0.56      1.00      0.72        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.90      0.99      0.94      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.40it/s, F1=0.995, train_acc=0.999, train_loss=0.146, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.53it/s, F1=0.94, eval_acc=0.971, eval_loss=4.74, eval_precision=0.931, eval_recall=0.95]  


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.91       523
         PRO       0.72      1.00      0.84        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.93      0.98      0.95      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.998, train_acc=1, train_loss=0.0616, train_precision=0.998, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.41it/s, F1=0.936, eval_acc=0.97, eval_loss=4.96, eval_precision=0.923, eval_recall=0.949] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.92      0.91       523
         PRO       0.69      1.00      0.82        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.87      0.98      0.92      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.999, train_acc=1, train_loss=0.0471, train_precision=0.999, train_recall=0.999]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       0.97      0.97      0.97        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.941, eval_acc=0.972, eval_loss=4.64, eval_precision=0.931, eval_recall=0.952]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.46it/s, F1=1, train_acc=1, train_loss=0.00944, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.944, eval_acc=0.973, eval_loss=4.82, eval_precision=0.934, eval_recall=0.954]


eval_reports:


calculate data/few_shot/resume/train_1000.json etag: 100%|██████████| 466k/466k [00:00<00:00, 259MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 205MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 218MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 883kB/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.92       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_1000.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_sho


count line size data/few_shot/resume/labels.txt: 29L [00:00, 226087.02L/s]
build line mapper: 29L [00:00, 235270.44L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8414.72it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 267518.25it/s]
load dataset from data/few_shot/resume/train_1000.json: 93it [00:00, 928.90it/s]

load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/204ecb844970c953244b42be8f449690_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_1000.json: 1000it [00:01, 809.56it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 830.29it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_1000_pretraind_task/Bert_960/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification mo

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.248, train_acc=0.609, train_loss=50.9, train_precision=0.224, train_recall=0.284]     


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.00      0.00        70
         EDU       0.11      0.12      0.11       197
         LOC       0.00      0.00      0.00        16
        NAME       0.06      0.11      0.08       271
         ORG       0.09      0.34      0.14      1151
         PRO       0.25      0.02      0.03        64
        RACE       0.00      0.00      0.00        32
       TITLE       0.13      0.32      0.19      1517

   micro avg       0.09      0.28      0.14      3318
   macro avg       0.08      0.11      0.07      3318
weighted avg       0.11      0.28      0.15      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.53it/s, F1=0.786, eval_acc=0.934, eval_loss=8.34, eval_precision=0.736, eval_recall=0.845]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.57      0.61      0.59        33
         EDU       0.65      0.73      0.68       106
         LOC       0.00      0.00      0.00         2
        NAME       0.90      0.87      0.88       110
         ORG       0.68      0.86      0.76       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.79      0.92      0.85       690

   micro avg       0.74      0.85      0.79      1497
   macro avg       0.45      0.50      0.47      1497
weighted avg       0.73      0.85      0.78      1497



Epoch: 2/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.809, train_acc=0.954, train_loss=6.69, train_precision=0.76, train_recall=0.871] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.77      0.96      0.85        70
         EDU       0.70      0.83      0.76       197
         LOC       0.05      0.06      0.06        16
        NAME       0.91      0.95      0.93       271
         ORG       0.70      0.86      0.77      1151
         PRO       0.25      0.34      0.29        64
        RACE       0.40      0.31      0.35        32
       TITLE       0.81      0.91      0.86      1517

   micro avg       0.75      0.87      0.81      3318
   macro avg       0.57      0.65      0.61      3318
weighted avg       0.75      0.87      0.81      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.908, eval_acc=0.964, eval_loss=4.75, eval_precision=0.88, eval_recall=0.939] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.92      0.98      0.95       106
         LOC       0.25      0.50      0.33         2
        NAME       0.98      0.99      0.99       110
         ORG       0.82      0.92      0.87       523
         PRO       0.77      0.94      0.85        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.86      0.93      0.90      1497
   macro avg       0.81      0.91      0.85      1497
weighted avg       0.86      0.93      0.90      1497



Epoch: 3/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.72it/s, F1=0.915, train_acc=0.978, train_loss=2.95, train_precision=0.891, train_recall=0.945]


train_reports:
              precision    recall  f1-score   support

        CONT       0.91      0.99      0.95        70
         EDU       0.95      0.97      0.96       197
         LOC       0.43      0.56      0.49        16
        NAME       0.95      0.96      0.95       271
         ORG       0.85      0.93      0.89      1151
         PRO       0.81      0.84      0.82        64
        RACE       0.71      0.84      0.77        32
       TITLE       0.90      0.96      0.93      1517

   micro avg       0.88      0.94      0.91      3318
   macro avg       0.81      0.88      0.84      3318
weighted avg       0.88      0.94      0.91      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.44it/s, F1=0.889, eval_acc=0.965, eval_loss=3.98, eval_precision=0.844, eval_recall=0.94] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.94      0.94        33
         EDU       0.94      0.95      0.95       106
         LOC       0.67      1.00      0.80         2
        NAME       0.97      1.00      0.99       110
         ORG       0.79      0.92      0.85       523
         PRO       0.75      1.00      0.86        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.82      0.93      0.87       690

   micro avg       0.83      0.93      0.88      1497
   macro avg       0.85      0.96      0.90      1497
weighted avg       0.83      0.93      0.88      1497



Epoch: 4/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.947, train_acc=0.989, train_loss=1.7, train_precision=0.93, train_recall=0.967]  


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      0.99      0.98        70
         EDU       0.96      0.97      0.96       197
         LOC       0.72      0.81      0.76        16
        NAME       0.98      0.99      0.98       271
         ORG       0.91      0.96      0.93      1151
         PRO       0.88      0.94      0.91        64
        RACE       0.84      0.84      0.84        32
       TITLE       0.93      0.96      0.95      1517

   micro avg       0.92      0.96      0.94      3318
   macro avg       0.90      0.93      0.92      3318
weighted avg       0.93      0.96      0.94      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.53it/s, F1=0.9, eval_acc=0.965, eval_loss=4.39, eval_precision=0.86, eval_recall=0.945]   


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.80      0.91      0.85       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.94      0.90       690

   micro avg       0.85      0.94      0.90      1497
   macro avg       0.87      0.98      0.92      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 5/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.76it/s, F1=0.968, train_acc=0.993, train_loss=1.03, train_precision=0.958, train_recall=0.978] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.96      0.99      0.97        70
         EDU       0.98      0.99      0.99       197
         LOC       0.76      0.81      0.79        16
        NAME       1.00      1.00      1.00       271
         ORG       0.94      0.97      0.96      1151
         PRO       0.93      0.98      0.95        64
        RACE       0.88      0.91      0.89        32
       TITLE       0.96      0.98      0.97      1517

   micro avg       0.95      0.98      0.97      3318
   macro avg       0.93      0.95      0.94      3318
weighted avg       0.95      0.98      0.97      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.891, eval_acc=0.969, eval_loss=4.31, eval_precision=0.858, eval_recall=0.927]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.78      0.88      0.83       523
         PRO       0.78      1.00      0.88        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.85      0.93      0.89       690

   micro avg       0.84      0.92      0.88      1497
   macro avg       0.90      0.96      0.93      1497
weighted avg       0.85      0.92      0.88      1497



Epoch: 6/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.39it/s, F1=0.973, train_acc=0.994, train_loss=0.804, train_precision=0.966, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      0.99      0.99        70
         EDU       0.99      1.00      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      1.00       271
         ORG       0.94      0.97      0.95      1151
         PRO       0.97      0.98      0.98        64
        RACE       1.00      0.97      0.98        32
       TITLE       0.97      0.98      0.98      1517

   micro avg       0.96      0.98      0.97      3318
   macro avg       0.98      0.99      0.98      3318
weighted avg       0.96      0.98      0.97      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.929, eval_acc=0.976, eval_loss=3.85, eval_precision=0.906, eval_recall=0.954]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.95      0.91       523
         PRO       0.90      1.00      0.95        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.95      0.97      0.96      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 7/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.983, train_acc=0.996, train_loss=0.603, train_precision=0.978, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

        CONT       0.96      0.97      0.96        70
         EDU       0.96      0.98      0.97       197
         LOC       0.94      1.00      0.97        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.99      1151
         PRO       0.93      0.97      0.95        64
        RACE       1.00      0.97      0.98        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.97      0.98      0.97      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.889, eval_acc=0.959, eval_loss=6.52, eval_precision=0.852, eval_recall=0.93] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.82      0.98      0.89       106
         LOC       0.50      1.00      0.67         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.93      0.87       523
         PRO       0.72      1.00      0.84        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.85      0.90      0.88       690

   micro avg       0.84      0.93      0.88      1497
   macro avg       0.83      0.97      0.88      1497
weighted avg       0.85      0.93      0.88      1497



Epoch: 8/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.972, train_acc=0.995, train_loss=0.775, train_precision=0.965, train_recall=0.981]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.96      0.98      0.97       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.96      0.98      0.97      1151
         PRO       0.91      0.92      0.91        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.97      0.98      0.97      1517

   micro avg       0.97      0.98      0.97      3318
   macro avg       0.97      0.98      0.98      3318
weighted avg       0.97      0.98      0.97      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.917, eval_acc=0.973, eval_loss=3.69, eval_precision=0.891, eval_recall=0.945]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.96      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.83      0.91      0.87       523
         PRO       0.78      1.00      0.88        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.92      0.97      0.94      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 9/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.79it/s, F1=0.993, train_acc=0.998, train_loss=0.244, train_precision=0.992, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.95      0.98      0.97        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.926, eval_acc=0.973, eval_loss=4.35, eval_precision=0.907, eval_recall=0.947]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.92      0.89       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.94      0.97      0.96      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 10/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.53it/s, F1=0.993, train_acc=0.999, train_loss=0.184, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      1.00      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.97      0.95      0.96        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.942, eval_acc=0.974, eval_loss=5.53, eval_precision=0.928, eval_recall=0.957]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.98      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.94      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 11/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.75it/s, F1=0.989, train_acc=0.997, train_loss=0.421, train_precision=0.985, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      1.00       271
         ORG       0.99      1.00      0.99      1151
         PRO       0.97      1.00      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.906, eval_acc=0.967, eval_loss=5.45, eval_precision=0.877, eval_recall=0.938]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.93      0.88       523
         PRO       0.81      0.94      0.87        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.86      0.91      0.89       690

   micro avg       0.87      0.93      0.90      1497
   macro avg       0.93      0.96      0.94      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 12/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.81it/s, F1=0.984, train_acc=0.997, train_loss=0.578, train_precision=0.979, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.96      0.98      0.97      1151
         PRO       0.98      0.98      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.924, eval_acc=0.97, eval_loss=5.38, eval_precision=0.899, eval_recall=0.952] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      1.00      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.89      0.95      0.92      1497
   macro avg       0.93      0.98      0.96      1497
weighted avg       0.89      0.95      0.92      1497



Epoch: 13/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.51it/s, F1=0.988, train_acc=0.998, train_loss=0.364, train_precision=0.984, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        70
         EDU       0.99      0.99      0.99       197
         LOC       0.94      0.94      0.94        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.98      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.98      0.99      0.99      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.919, eval_acc=0.973, eval_loss=4.37, eval_precision=0.897, eval_recall=0.943]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       1.00      1.00      1.00       110
         ORG       0.84      0.91      0.87       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.93      0.98      0.95      1497
weighted avg       0.89      0.94      0.91      1497



Epoch: 14/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.79it/s, F1=0.985, train_acc=0.997, train_loss=0.581, train_precision=0.981, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.97      0.98      0.98      1151
         PRO       0.98      0.98      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.99      0.99      0.99      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.72it/s, F1=0.909, eval_acc=0.965, eval_loss=5.68, eval_precision=0.886, eval_recall=0.934]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.94      0.94        33
         EDU       0.95      1.00      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       1.00      0.99      1.00       110
         ORG       0.81      0.91      0.86       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.90      0.92      0.91       690

   micro avg       0.88      0.93      0.90      1497
   macro avg       0.92      0.96      0.94      1497
weighted avg       0.88      0.93      0.90      1497



Epoch: 15/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.989, train_acc=0.998, train_loss=0.346, train_precision=0.986, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.98      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.909, eval_acc=0.969, eval_loss=4.86, eval_precision=0.881, eval_recall=0.94] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      1.00      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.81      0.90      0.85       523
         PRO       0.75      1.00      0.86        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.88      0.94      0.91       690

   micro avg       0.87      0.94      0.90      1497
   macro avg       0.92      0.98      0.95      1497
weighted avg       0.87      0.94      0.90      1497



Epoch: 16/30 Train: 100%|██████████| 125/125 [00:35<00:00,  3.51it/s, F1=0.994, train_acc=0.999, train_loss=0.155, train_precision=0.992, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      1.00      1.00      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.923, eval_acc=0.971, eval_loss=5.17, eval_precision=0.905, eval_recall=0.943]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.98      0.98      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.91      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 17/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.996, train_acc=0.999, train_loss=0.151, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      0.99      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.928, eval_acc=0.971, eval_loss=5.61, eval_precision=0.909, eval_recall=0.948]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 18/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.998, train_acc=1, train_loss=0.0386, train_precision=0.998, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.928, eval_acc=0.971, eval_loss=6.21, eval_precision=0.907, eval_recall=0.95] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.93      0.98      0.96      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 19/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.44it/s, F1=1, train_acc=1, train_loss=0.025, train_precision=1, train_recall=1]               


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.933, eval_acc=0.971, eval_loss=6.35, eval_precision=0.916, eval_recall=0.952]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 20/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.79it/s, F1=0.996, train_acc=0.999, train_loss=0.134, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      0.99      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.916, eval_acc=0.968, eval_loss=6.55, eval_precision=0.889, eval_recall=0.945]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.83      0.93      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.89      0.92      0.91       690

   micro avg       0.88      0.94      0.91      1497
   macro avg       0.93      0.98      0.95      1497
weighted avg       0.88      0.94      0.91      1497



Epoch: 21/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.79it/s, F1=0.978, train_acc=0.997, train_loss=0.54, train_precision=0.971, train_recall=0.986] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.95      0.98      0.97      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.97      0.99      0.98      1517

   micro avg       0.97      0.99      0.98      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.97      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.37it/s, F1=0.906, eval_acc=0.966, eval_loss=5.88, eval_precision=0.876, eval_recall=0.938]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.87      0.82      0.84        33
         EDU       0.95      0.99      0.97       106
         LOC       0.25      1.00      0.40         2
        NAME       0.99      1.00      1.00       110
         ORG       0.82      0.92      0.87       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.87      0.92      0.89       690

   micro avg       0.86      0.93      0.90      1497
   macro avg       0.81      0.96      0.85      1497
weighted avg       0.87      0.93      0.90      1497



Epoch: 22/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.78it/s, F1=0.991, train_acc=0.999, train_loss=0.278, train_precision=0.989, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      0.99      0.98        70
         EDU       0.99      0.99      0.99       197
         LOC       0.83      0.94      0.88        16
        NAME       1.00      1.00      1.00       271
         ORG       0.98      0.99      0.99      1151
         PRO       0.98      0.98      0.98        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      0.99      0.99      3318
   macro avg       0.97      0.99      0.98      3318
weighted avg       0.99      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.935, eval_acc=0.972, eval_loss=5.7, eval_precision=0.922, eval_recall=0.949] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 23/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=0.994, train_acc=0.999, train_loss=0.346, train_precision=0.992, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.98      0.99      0.98       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      1.00      1151
         PRO       0.95      0.98      0.97        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      0.99      0.99      1517

   micro avg       0.99      1.00      0.99      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.99      1.00      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.928, eval_acc=0.969, eval_loss=4.96, eval_precision=0.908, eval_recall=0.951]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.93      0.98      0.96      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 24/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.69it/s, F1=0.988, train_acc=0.997, train_loss=0.505, train_precision=0.984, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       0.99      0.99      0.99       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      0.99      1.00       271
         ORG       0.98      0.99      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.99      1517

   micro avg       0.98      0.99      0.99      3318
   macro avg       0.99      1.00      1.00      3318
weighted avg       0.98      0.99      0.99      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.933, eval_acc=0.97, eval_loss=6.13, eval_precision=0.922, eval_recall=0.944] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.95      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.92      0.90       523
         PRO       0.86      1.00      0.92        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 25/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.81it/s, F1=0.985, train_acc=0.997, train_loss=0.471, train_precision=0.98, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       0.99      1.00      1.00       271
         ORG       0.97      0.99      0.98      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.98      0.99      0.98      1517

   micro avg       0.98      0.99      0.98      3318
   macro avg       0.99      1.00      0.99      3318
weighted avg       0.98      0.99      0.98      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.73it/s, F1=0.929, eval_acc=0.972, eval_loss=4.64, eval_precision=0.916, eval_recall=0.944]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.85      0.91      0.88       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.93      0.93       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 26/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.47it/s, F1=0.995, train_acc=0.999, train_loss=0.168, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       0.99      1.00      0.99      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       0.99      1.00      0.99      1517

   micro avg       0.99      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       0.99      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.46it/s, F1=0.926, eval_acc=0.975, eval_loss=4.69, eval_precision=0.909, eval_recall=0.945]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.93      0.89       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.90      0.92      0.91       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 27/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.75it/s, F1=0.998, train_acc=1, train_loss=0.04, train_precision=0.998, train_recall=0.999]     


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.935, eval_acc=0.975, eval_loss=4.92, eval_precision=0.922, eval_recall=0.949]


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.93      0.90       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.91      0.94      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.91      0.94      0.93      1497



Epoch: 28/30 Train: 100%|██████████| 125/125 [00:33<00:00,  3.77it/s, F1=0.999, train_acc=1, train_loss=0.042, train_precision=0.998, train_recall=0.999] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.23it/s, F1=0.93, eval_acc=0.973, eval_loss=5.34, eval_precision=0.917, eval_recall=0.945] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.91      0.89       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 29/30 Train: 100%|██████████| 125/125 [00:36<00:00,  3.42it/s, F1=1, train_acc=1, train_loss=0.0198, train_precision=1, train_recall=1]       


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      1.00      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       1.00      1.00      1.00        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.71it/s, F1=0.926, eval_acc=0.971, eval_loss=5.59, eval_precision=0.91, eval_recall=0.943] 


eval_reports:


  0%|          | 0/125 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.98      1.00      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.91      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 30/30 Train: 100%|██████████| 125/125 [00:32<00:00,  3.80it/s, F1=0.998, train_acc=0.999, train_loss=0.0959, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        70
         EDU       1.00      0.99      1.00       197
         LOC       1.00      1.00      1.00        16
        NAME       1.00      1.00      1.00       271
         ORG       1.00      1.00      1.00      1151
         PRO       0.98      1.00      0.99        64
        RACE       1.00      1.00      1.00        32
       TITLE       1.00      1.00      1.00      1517

   micro avg       1.00      1.00      1.00      3318
   macro avg       1.00      1.00      1.00      3318
weighted avg       1.00      1.00      1.00      3318



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.924, eval_acc=0.97, eval_loss=5.88, eval_precision=0.906, eval_recall=0.944] 


eval_reports:


calculate data/few_shot/resume/train_1350.json etag: 100%|██████████| 639k/639k [00:00<00:00, 275MB/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.92      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.93      0.98      0.95      1497
weighted avg       0.91      0.94      0.92      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_1350.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_sho


calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 201MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 280MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 373kB/s]


load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/lexicon_tree


count line size data/few_shot/resume/labels.txt: 29L [00:00, 219557.43L/s]
build line mapper: 29L [00:00, 46782.62L/s]9 [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 9316.39it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 273754.11it/s]
load dataset from data/few_shot/resume/train_1350.json: 0it [00:00, ?it/s]

load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_1350.json: 1350it [00:01, 797.84it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 826.23it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification m

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.426, train_acc=0.696, train_loss=37.6, train_precision=0.4, train_recall=0.461]         


train_reports:
              precision    recall  f1-score   support

        CONT       0.01      0.20      0.02        86
         EDU       0.24      0.23      0.23       263
         LOC       0.00      0.00      0.00        22
        NAME       0.25      0.27      0.26       347
         ORG       0.15      0.50      0.24      1591
         PRO       0.00      0.00      0.00        86
        RACE       0.00      0.00      0.00        45
       TITLE       0.63      0.54      0.58      2111

   micro avg       0.19      0.46      0.27      4551
   macro avg       0.16      0.22      0.17      4551
weighted avg       0.38      0.46      0.38      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.35it/s, F1=0.86, eval_acc=0.95, eval_loss=5.19, eval_precision=0.826, eval_recall=0.899]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.56      0.88      0.68        33
         EDU       0.76      0.84      0.80       106
         LOC       0.00      0.00      0.00         2
        NAME       0.99      0.97      0.98       110
         ORG       0.75      0.91      0.83       523
         PRO       0.00      0.00      0.00        18
        RACE       0.00      0.00      0.00        15
       TITLE       0.86      0.92      0.89       690

   micro avg       0.80      0.89      0.85      1497
   macro avg       0.49      0.57      0.52      1497
weighted avg       0.80      0.89      0.84      1497



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.885, train_acc=0.969, train_loss=3.74, train_precision=0.859, train_recall=0.916]


train_reports:
              precision    recall  f1-score   support

        CONT       0.70      0.95      0.81        86
         EDU       0.82      0.91      0.86       263
         LOC       0.40      0.36      0.38        22
        NAME       0.97      0.98      0.97       347
         ORG       0.83      0.91      0.87      1591
         PRO       0.49      0.60      0.54        86
        RACE       0.63      0.76      0.69        45
       TITLE       0.90      0.93      0.92      2111

   micro avg       0.86      0.92      0.89      4551
   macro avg       0.72      0.80      0.76      4551
weighted avg       0.86      0.92      0.89      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.923, eval_acc=0.97, eval_loss=2.83, eval_precision=0.904, eval_recall=0.944] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.94      0.97      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.84      0.91      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.89      0.94      0.92      1497
   macro avg       0.89      0.97      0.92      1497
weighted avg       0.89      0.94      0.92      1497



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.50it/s, F1=0.942, train_acc=0.983, train_loss=1.94, train_precision=0.93, train_recall=0.956] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.98      1.00      0.99        86
         EDU       0.94      0.97      0.96       263
         LOC       0.68      0.77      0.72        22
        NAME       0.98      0.99      0.98       347
         ORG       0.91      0.95      0.93      1591
         PRO       0.84      0.92      0.88        86
        RACE       0.91      0.91      0.91        45
       TITLE       0.95      0.96      0.95      2111

   micro avg       0.93      0.96      0.94      4551
   macro avg       0.90      0.93      0.92      4551
weighted avg       0.93      0.96      0.94      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.20it/s, F1=0.92, eval_acc=0.968, eval_loss=3.37, eval_precision=0.9, eval_recall=0.942]   


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.90      0.87       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.94      0.92       690

   micro avg       0.89      0.94      0.91      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.89      0.94      0.92      1497



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.96, train_acc=0.99, train_loss=1.18, train_precision=0.951, train_recall=0.97]   


train_reports:
              precision    recall  f1-score   support

        CONT       0.98      0.99      0.98        86
         EDU       0.98      0.99      0.99       263
         LOC       0.70      0.86      0.78        22
        NAME       0.99      0.99      0.99       347
         ORG       0.93      0.96      0.95      1591
         PRO       0.87      0.92      0.89        86
        RACE       0.89      0.93      0.91        45
       TITLE       0.96      0.97      0.96      2111

   micro avg       0.95      0.97      0.96      4551
   macro avg       0.91      0.95      0.93      4551
weighted avg       0.95      0.97      0.96      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.939, eval_acc=0.973, eval_loss=3.19, eval_precision=0.928, eval_recall=0.951]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      0.97      0.98        33
         EDU       0.95      0.98      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.94      0.97      0.95      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.54it/s, F1=0.974, train_acc=0.993, train_loss=0.86, train_precision=0.967, train_recall=0.981] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        86
         EDU       0.98      0.99      0.98       263
         LOC       0.91      0.91      0.91        22
        NAME       1.00      1.00      1.00       347
         ORG       0.95      0.98      0.96      1591
         PRO       0.85      0.93      0.89        86
        RACE       0.91      0.93      0.92        45
       TITLE       0.97      0.98      0.98      2111

   micro avg       0.96      0.98      0.97      4551
   macro avg       0.95      0.97      0.96      4551
weighted avg       0.97      0.98      0.97      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.935, eval_acc=0.975, eval_loss=2.76, eval_precision=0.921, eval_recall=0.95] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      0.97      0.98        33
         EDU       0.95      0.96      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.94      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.92      0.93      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.91      0.97      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.72it/s, F1=0.982, train_acc=0.994, train_loss=0.732, train_precision=0.979, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      0.98      0.97        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.97      0.98      0.98      1591
         PRO       0.92      0.98      0.95        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.98      0.99      0.98      2111

   micro avg       0.98      0.99      0.98      4551
   macro avg       0.98      0.99      0.98      4551
weighted avg       0.98      0.99      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.944, eval_acc=0.977, eval_loss=3.02, eval_precision=0.929, eval_recall=0.96] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.94      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.95      0.94       690

   micro avg       0.92      0.96      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.92      0.96      0.94      1497



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.72it/s, F1=0.983, train_acc=0.996, train_loss=0.443, train_precision=0.98, train_recall=0.986] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.98      0.99      0.98        86
         EDU       0.98      0.99      0.98       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.97      0.98      0.98      1591
         PRO       0.98      0.99      0.98        86
        RACE       0.96      0.98      0.97        45
       TITLE       0.98      0.99      0.99      2111

   micro avg       0.98      0.99      0.98      4551
   macro avg       0.98      0.99      0.98      4551
weighted avg       0.98      0.99      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.947, eval_acc=0.973, eval_loss=3.44, eval_precision=0.936, eval_recall=0.958]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.92      0.95      0.93       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.96      0.94      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.93      0.96      0.94      1497



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.50it/s, F1=0.995, train_acc=0.999, train_loss=0.187, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      1.00      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      0.99      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.97      0.99      0.98        86
        RACE       1.00      0.98      0.99        45
       TITLE       0.99      1.00      1.00      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.46it/s, F1=0.942, eval_acc=0.973, eval_loss=4.06, eval_precision=0.926, eval_recall=0.959]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.95      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.96      0.94      1497
   macro avg       0.95      0.99      0.97      1497
weighted avg       0.92      0.96      0.94      1497



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.79it/s, F1=0.994, train_acc=0.999, train_loss=0.213, train_precision=0.992, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.99      0.99      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.62it/s, F1=0.943, eval_acc=0.974, eval_loss=4.38, eval_precision=0.933, eval_recall=0.954]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      1.00      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      0.99      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.96      0.98      0.97      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.52it/s, F1=0.988, train_acc=0.997, train_loss=0.394, train_precision=0.986, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.98      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.944, eval_acc=0.973, eval_loss=4.13, eval_precision=0.935, eval_recall=0.953]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.99      0.99      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.94      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.96      0.97      0.96      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.988, train_acc=0.997, train_loss=0.414, train_precision=0.985, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.98      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.98      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.21it/s, F1=0.945, eval_acc=0.971, eval_loss=4.24, eval_precision=0.937, eval_recall=0.953]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.98      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.92      0.94      0.93       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.95      0.98      0.97      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.994, train_acc=0.998, train_loss=0.266, train_precision=0.993, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:04<00:00,  1.60it/s, F1=0.928, eval_acc=0.967, eval_loss=4.6, eval_precision=0.906, eval_recall=0.952] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.96      0.98      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.85      0.92      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.95      0.93       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.71it/s, F1=0.993, train_acc=0.998, train_loss=0.327, train_precision=0.991, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.61it/s, F1=0.943, eval_acc=0.974, eval_loss=3.54, eval_precision=0.934, eval_recall=0.952]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.97      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.91      0.94      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.95      0.98      0.97      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.998, train_acc=1, train_loss=0.0966, train_precision=0.997, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.946, eval_acc=0.973, eval_loss=4.63, eval_precision=0.937, eval_recall=0.956]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.98      0.99      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.91      0.94      0.93       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.995, train_acc=0.999, train_loss=0.198, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      1.00      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.943, eval_acc=0.975, eval_loss=4.44, eval_precision=0.928, eval_recall=0.958]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.91      0.95      0.93       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.96      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.93      0.96      0.94      1497



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.75it/s, F1=0.996, train_acc=0.999, train_loss=0.119, train_precision=0.996, train_recall=0.996] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.945, eval_acc=0.975, eval_loss=4.01, eval_precision=0.931, eval_recall=0.959]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.91      0.95      0.93       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.96      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.93      0.96      0.94      1497



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.72it/s, F1=0.995, train_acc=0.999, train_loss=0.226, train_precision=0.995, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.935, eval_acc=0.971, eval_loss=5.21, eval_precision=0.924, eval_recall=0.947]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.86      0.95      0.90       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      0.99      0.99       110
         ORG       0.90      0.92      0.91       523
         PRO       0.74      0.94      0.83        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.93      0.97      0.95      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.72it/s, F1=0.986, train_acc=0.996, train_loss=0.48, train_precision=0.982, train_recall=0.989] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      1.00      1.00       347
         ORG       0.98      0.99      0.98      1591
         PRO       0.83      0.90      0.86        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.97      0.98      0.98      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.939, eval_acc=0.976, eval_loss=3.16, eval_precision=0.93, eval_recall=0.948] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.93      0.95      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.94      0.94      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.95      0.97      0.96      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.72it/s, F1=0.992, train_acc=0.998, train_loss=0.422, train_precision=0.992, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.98      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.906, eval_acc=0.963, eval_loss=4.84, eval_precision=0.882, eval_recall=0.932]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.83      0.94      0.88       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.88      0.90      0.89       690

   micro avg       0.88      0.93      0.90      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.88      0.93      0.90      1497



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.991, train_acc=0.997, train_loss=0.295, train_precision=0.988, train_recall=0.993]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.99      1591
         PRO       0.98      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.946, eval_acc=0.973, eval_loss=4.78, eval_precision=0.933, eval_recall=0.96] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.95      0.93       523
         PRO       0.74      0.94      0.83        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.96      0.95       690

   micro avg       0.93      0.96      0.94      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.93      0.96      0.94      1497



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.995, train_acc=0.999, train_loss=0.188, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      0.99      1591
         PRO       0.93      0.97      0.95        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.937, eval_acc=0.97, eval_loss=4.66, eval_precision=0.924, eval_recall=0.951] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.90      0.96      0.93       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.92      0.94      0.93       523
         PRO       0.51      1.00      0.68        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.94      0.93       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.91      0.98      0.93      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.997, train_acc=0.999, train_loss=0.169, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       0.93      0.98      0.95        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.944, eval_acc=0.973, eval_loss=4.1, eval_precision=0.936, eval_recall=0.951] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.91       523
         PRO       0.81      0.94      0.87        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.95      0.97      0.96      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=1, train_acc=1, train_loss=0.0303, train_precision=0.999, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.936, eval_acc=0.969, eval_loss=5.02, eval_precision=0.929, eval_recall=0.944]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      1.00      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.91      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.93      0.94      0.93      1497



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.78it/s, F1=1, train_acc=1, train_loss=0.0253, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.944, eval_acc=0.974, eval_loss=4.57, eval_precision=0.936, eval_recall=0.952]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.93      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.45it/s, F1=1, train_acc=1, train_loss=0.00781, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.951, eval_acc=0.977, eval_loss=4.48, eval_precision=0.943, eval_recall=0.959]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.92      0.94      0.93       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.95      0.96      0.95       690

   micro avg       0.94      0.96      0.95      1497
   macro avg       0.96      0.98      0.97      1497
weighted avg       0.94      0.96      0.95      1497



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.71it/s, F1=1, train_acc=1, train_loss=0.00395, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.952, eval_acc=0.977, eval_loss=4.59, eval_precision=0.945, eval_recall=0.959]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.92      0.94      0.93       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.95      0.96      0.95       690

   micro avg       0.94      0.96      0.95      1497
   macro avg       0.96      0.98      0.97      1497
weighted avg       0.94      0.96      0.95      1497



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.49it/s, F1=1, train_acc=1, train_loss=0.0202, train_precision=1, train_recall=1] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.951, eval_acc=0.975, eval_loss=4.66, eval_precision=0.943, eval_recall=0.959]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.97      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.92      0.95      0.93       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.94      0.96      0.95      1497
   macro avg       0.96      0.98      0.97      1497
weighted avg       0.94      0.96      0.95      1497



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=1, train_acc=1, train_loss=0.00477, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.48it/s, F1=0.954, eval_acc=0.976, eval_loss=4.84, eval_precision=0.948, eval_recall=0.96] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.98      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.93      0.95      0.94       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.95      0.96      0.95       690

   micro avg       0.95      0.96      0.95      1497
   macro avg       0.96      0.99      0.97      1497
weighted avg       0.95      0.96      0.95      1497



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=1, train_acc=1, train_loss=0.00658, train_precision=1, train_recall=1]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.954, eval_acc=0.977, eval_loss=4.91, eval_precision=0.945, eval_recall=0.963]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.93      0.95      0.94       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.95      0.96      0.95       690

   micro avg       0.94      0.96      0.95      1497
   macro avg       0.96      0.99      0.97      1497
weighted avg       0.94      0.96      0.95      1497



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.49it/s, F1=0.993, train_acc=0.998, train_loss=0.32, train_precision=0.991, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.934, eval_acc=0.969, eval_loss=5.44, eval_precision=0.924, eval_recall=0.946]


eval_reports:


calculate data/few_shot/resume/train_1350.json etag: 100%|██████████| 639k/639k [00:00<00:00, 297MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 198MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 206MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 317kB/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.98      1.00      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.92      0.90       523
         PRO       0.90      1.00      0.95        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.96      0.98      0.97      1497
weighted avg       0.92      0.94      0.93      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_1350.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_sho


count line size data/few_shot/resume/labels.txt: 29L [00:00, 207214.34L/s]
build line mapper: 29L [00:00, 211171.56L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8011.25it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 280287.62it/s]
load dataset from data/few_shot/resume/train_1350.json: 93it [00:00, 928.54it/s]

load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_1350.json: 1350it [00:01, 798.71it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 821.49it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification m

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.399, train_acc=0.692, train_loss=38.1, train_precision=0.37, train_recall=0.44]         


train_reports:
              precision    recall  f1-score   support

        CONT       0.00      0.02      0.00        86
         EDU       0.03      0.30      0.06       263
         LOC       0.00      0.00      0.00        22
        NAME       0.40      0.28      0.33       347
         ORG       0.15      0.49      0.23      1591
         PRO       0.02      0.01      0.02        86
        RACE       0.01      0.07      0.02        45
       TITLE       0.57      0.52      0.54      2111

   micro avg       0.18      0.45      0.26      4551
   macro avg       0.15      0.21      0.15      4551
weighted avg       0.35      0.45      0.36      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.845, eval_acc=0.954, eval_loss=5.29, eval_precision=0.795, eval_recall=0.904]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.86      0.94      0.90        33
         EDU       0.74      0.90      0.81       106
         LOC       0.00      0.00      0.00         2
        NAME       0.97      0.94      0.95       110
         ORG       0.75      0.93      0.83       523
         PRO       0.03      0.06      0.04        18
        RACE       0.87      0.87      0.87        15
       TITLE       0.82      0.90      0.86       690

   micro avg       0.78      0.90      0.84      1497
   macro avg       0.63      0.69      0.66      1497
weighted avg       0.79      0.90      0.84      1497



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.75it/s, F1=0.89, train_acc=0.97, train_loss=3.87, train_precision=0.861, train_recall=0.924]  


train_reports:
              precision    recall  f1-score   support

        CONT       0.82      0.97      0.89        86
         EDU       0.89      0.95      0.92       263
         LOC       0.11      0.18      0.13        22
        NAME       0.93      0.97      0.94       347
         ORG       0.83      0.92      0.87      1591
         PRO       0.46      0.65      0.54        86
        RACE       0.79      0.91      0.85        45
       TITLE       0.90      0.94      0.92      2111

   micro avg       0.85      0.92      0.89      4551
   macro avg       0.71      0.81      0.76      4551
weighted avg       0.86      0.92      0.89      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.61it/s, F1=0.923, eval_acc=0.97, eval_loss=3.43, eval_precision=0.902, eval_recall=0.945] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.94      0.93        33
         EDU       0.92      0.95      0.94       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.68      0.94      0.79        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.92      0.95      0.93       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.87      0.96      0.90      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.51it/s, F1=0.949, train_acc=0.984, train_loss=2.13, train_precision=0.938, train_recall=0.961]


train_reports:
              precision    recall  f1-score   support

        CONT       0.93      0.98      0.95        86
         EDU       0.97      0.97      0.97       263
         LOC       0.70      0.73      0.71        22
        NAME       0.98      1.00      0.99       347
         ORG       0.91      0.95      0.93      1591
         PRO       0.90      0.98      0.94        86
        RACE       0.87      0.89      0.88        45
       TITLE       0.94      0.96      0.95      2111

   micro avg       0.93      0.96      0.94      4551
   macro avg       0.90      0.93      0.92      4551
weighted avg       0.93      0.96      0.94      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.46it/s, F1=0.912, eval_acc=0.964, eval_loss=3.54, eval_precision=0.88, eval_recall=0.947] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.87      0.97      0.92       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.83      0.93      0.88       523
         PRO       0.81      0.94      0.87        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.89      0.94      0.92       690

   micro avg       0.87      0.95      0.91      1497
   macro avg       0.87      0.97      0.91      1497
weighted avg       0.88      0.95      0.91      1497



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.962, train_acc=0.99, train_loss=1.42, train_precision=0.954, train_recall=0.971] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.94      0.98      0.96        86
         EDU       0.97      0.98      0.98       263
         LOC       0.78      0.82      0.80        22
        NAME       0.99      1.00      1.00       347
         ORG       0.93      0.96      0.94      1591
         PRO       0.85      0.95      0.90        86
        RACE       1.00      0.98      0.99        45
       TITLE       0.97      0.98      0.97      2111

   micro avg       0.95      0.97      0.96      4551
   macro avg       0.93      0.96      0.94      4551
weighted avg       0.95      0.97      0.96      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.25it/s, F1=0.937, eval_acc=0.973, eval_loss=3.79, eval_precision=0.922, eval_recall=0.954]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.91      0.94      0.93        33
         EDU       0.94      0.99      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.77      0.94      0.85        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.89      0.96      0.92      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.971, train_acc=0.992, train_loss=1, train_precision=0.964, train_recall=0.978]    


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        86
         EDU       0.98      0.99      0.98       263
         LOC       0.75      0.82      0.78        22
        NAME       0.99      1.00      1.00       347
         ORG       0.95      0.97      0.96      1591
         PRO       0.94      0.99      0.97        86
        RACE       0.98      0.98      0.98        45
       TITLE       0.97      0.98      0.97      2111

   micro avg       0.96      0.98      0.97      4551
   macro avg       0.94      0.96      0.95      4551
weighted avg       0.96      0.98      0.97      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.69it/s, F1=0.909, eval_acc=0.971, eval_loss=3.28, eval_precision=0.89, eval_recall=0.93]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.94      0.97      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.91      0.87       523
         PRO       0.74      0.94      0.83        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.88      0.91      0.90       690

   micro avg       0.88      0.92      0.90      1497
   macro avg       0.88      0.95      0.91      1497
weighted avg       0.88      0.92      0.90      1497



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.50it/s, F1=0.978, train_acc=0.994, train_loss=0.785, train_precision=0.974, train_recall=0.983]


train_reports:
              precision    recall  f1-score   support

        CONT       0.98      1.00      0.99        86
         EDU       0.98      0.98      0.98       263
         LOC       0.87      0.91      0.89        22
        NAME       1.00      1.00      1.00       347
         ORG       0.96      0.98      0.97      1591
         PRO       0.95      0.98      0.97        86
        RACE       1.00      0.98      0.99        45
       TITLE       0.98      0.98      0.98      2111

   micro avg       0.97      0.98      0.98      4551
   macro avg       0.96      0.98      0.97      4551
weighted avg       0.97      0.98      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.935, eval_acc=0.971, eval_loss=3.65, eval_precision=0.917, eval_recall=0.955]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.86      0.93      0.90       523
         PRO       0.81      0.94      0.87        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.89      0.97      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.99, train_acc=0.997, train_loss=0.383, train_precision=0.988, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        86
         EDU       0.98      0.99      0.99       263
         LOC       0.88      0.95      0.91        22
        NAME       0.99      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.93      0.97      0.95        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.97      0.99      0.98      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.938, eval_acc=0.974, eval_loss=3.79, eval_precision=0.924, eval_recall=0.953]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.95      0.99      0.97       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.94      0.97      0.96      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.50it/s, F1=0.988, train_acc=0.997, train_loss=0.349, train_precision=0.985, train_recall=0.99] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.98      1591
         PRO       0.97      0.98      0.97        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.93, eval_acc=0.97, eval_loss=5.04, eval_precision=0.918, eval_recall=0.944]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.87      0.92      0.89       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.93      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.978, train_acc=0.994, train_loss=0.833, train_precision=0.972, train_recall=0.984]


train_reports:
              precision    recall  f1-score   support

        CONT       0.97      0.99      0.98        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       0.96      1.00      0.98       347
         ORG       0.96      0.98      0.97      1591
         PRO       0.89      0.93      0.91        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.98      0.99      0.98      2111

   micro avg       0.97      0.98      0.98      4551
   macro avg       0.97      0.98      0.98      4551
weighted avg       0.97      0.98      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.92, eval_acc=0.969, eval_loss=3.91, eval_precision=0.902, eval_recall=0.938] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      0.99      0.99       110
         ORG       0.84      0.91      0.87       523
         PRO       0.63      0.94      0.76        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.87      0.96      0.91      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.981, train_acc=0.994, train_loss=0.723, train_precision=0.977, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      1.00      0.99        86
         EDU       0.99      0.99      0.99       263
         LOC       0.88      0.95      0.91        22
        NAME       0.96      0.99      0.97       347
         ORG       0.97      0.98      0.98      1591
         PRO       0.90      0.95      0.93        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.98      0.99      0.98      4551
   macro avg       0.96      0.98      0.97      4551
weighted avg       0.98      0.99      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.60it/s, F1=0.93, eval_acc=0.971, eval_loss=4.52, eval_precision=0.913, eval_recall=0.948] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.93      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.52it/s, F1=0.988, train_acc=0.997, train_loss=0.384, train_precision=0.985, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.98      1591
         PRO       0.93      0.95      0.94        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.926, eval_acc=0.969, eval_loss=4.72, eval_precision=0.911, eval_recall=0.942]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.75      1.00      0.86        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.93      0.92       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.88      0.98      0.92      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.70it/s, F1=0.995, train_acc=0.999, train_loss=0.229, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.98      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.939, eval_acc=0.972, eval_loss=4.79, eval_precision=0.929, eval_recall=0.948]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.92      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.45it/s, F1=0.998, train_acc=1, train_loss=0.0911, train_precision=0.998, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.938, eval_acc=0.973, eval_loss=4.9, eval_precision=0.927, eval_recall=0.95]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.998, train_acc=0.999, train_loss=0.0643, train_precision=0.998, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.943, eval_acc=0.973, eval_loss=5.35, eval_precision=0.931, eval_recall=0.955]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      0.99      0.99       110
         ORG       0.90      0.93      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.72it/s, F1=0.998, train_acc=1, train_loss=0.0573, train_precision=0.998, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.942, eval_acc=0.972, eval_loss=5.34, eval_precision=0.933, eval_recall=0.952]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.91      0.93      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.46it/s, F1=0.998, train_acc=1, train_loss=0.0567, train_precision=0.997, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      1.00      0.99       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.941, eval_acc=0.973, eval_loss=5.34, eval_precision=0.932, eval_recall=0.951]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      0.99      0.99       110
         ORG       0.90      0.93      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.997, train_acc=1, train_loss=0.0745, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      0.99      1591
         PRO       0.98      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.67it/s, F1=0.943, eval_acc=0.973, eval_loss=5.04, eval_precision=0.933, eval_recall=0.954]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.93      0.92       523
         PRO       0.75      1.00      0.86        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.96      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.991, train_acc=0.998, train_loss=0.366, train_precision=0.99, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.97      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.93, eval_acc=0.972, eval_loss=4.83, eval_precision=0.914, eval_recall=0.948] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.94      0.97      0.95       106
         LOC       0.40      1.00      0.57         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.68      0.94      0.79        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.84      0.97      0.88      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.50it/s, F1=0.994, train_acc=0.999, train_loss=0.289, train_precision=0.993, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.97      0.98      0.97        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.944, eval_acc=0.97, eval_loss=5.08, eval_precision=0.933, eval_recall=0.955] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.93      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.997, train_acc=1, train_loss=0.0812, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.94, eval_acc=0.971, eval_loss=5.21, eval_precision=0.927, eval_recall=0.954] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.94      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.50it/s, F1=0.996, train_acc=0.999, train_loss=0.155, train_precision=0.995, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       0.99      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.939, eval_acc=0.971, eval_loss=4.79, eval_precision=0.93, eval_recall=0.948] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      0.95      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.97      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.76it/s, F1=0.989, train_acc=0.997, train_loss=0.413, train_precision=0.987, train_recall=0.991]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.98      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.94, eval_acc=0.972, eval_loss=4.37, eval_precision=0.928, eval_recall=0.954] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.94      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.52it/s, F1=0.996, train_acc=0.999, train_loss=0.188, train_precision=0.996, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.61it/s, F1=0.941, eval_acc=0.971, eval_loss=4.01, eval_precision=0.929, eval_recall=0.954]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.94      0.94        33
         EDU       0.97      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.94      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.75it/s, F1=0.995, train_acc=0.999, train_loss=0.311, train_precision=0.994, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.97      0.99      0.98       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       0.99      1.00      1.00      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.99      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.935, eval_acc=0.968, eval_loss=4.68, eval_precision=0.924, eval_recall=0.947]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.93      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.78it/s, F1=0.993, train_acc=0.998, train_loss=0.349, train_precision=0.991, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.99      0.99      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.933, eval_acc=0.967, eval_loss=4.73, eval_precision=0.924, eval_recall=0.943]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.97      0.94      0.96       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.92      0.90       523
         PRO       0.67      1.00      0.80        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.94      0.93       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.89      0.98      0.92      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.48it/s, F1=0.987, train_acc=0.996, train_loss=0.492, train_precision=0.985, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.98      0.98      1591
         PRO       0.94      0.98      0.96        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.941, eval_acc=0.971, eval_loss=5.61, eval_precision=0.935, eval_recall=0.948]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.95      0.94      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.95      0.98      0.97      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.71it/s, F1=0.994, train_acc=0.998, train_loss=0.261, train_precision=0.993, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.98      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      1.00      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.935, eval_acc=0.966, eval_loss=4.81, eval_precision=0.927, eval_recall=0.943]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.98      0.99      0.99       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.91      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.95      0.98      0.97      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.48it/s, F1=0.996, train_acc=0.999, train_loss=0.169, train_precision=0.995, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       0.99      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.57it/s, F1=0.936, eval_acc=0.969, eval_loss=4.28, eval_precision=0.924, eval_recall=0.948]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.97      0.97      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.93      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.93      0.94      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.997, train_acc=0.999, train_loss=0.225, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.97      0.99      0.98       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       0.98      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.932, eval_acc=0.968, eval_loss=4.93, eval_precision=0.917, eval_recall=0.948]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.99      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.92      0.90       523
         PRO       0.86      1.00      0.92        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.92      0.95      0.93       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.93      0.98      0.96      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.78it/s, F1=0.998, train_acc=0.999, train_loss=0.111, train_precision=0.997, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.61it/s, F1=0.941, eval_acc=0.97, eval_loss=4.58, eval_precision=0.932, eval_recall=0.95]  


eval_reports:


calculate data/few_shot/resume/train_1350.json etag: 100%|██████████| 639k/639k [00:00<00:00, 298MB/s]
calculate data/few_shot/resume/dev.json etag: 100%|██████████| 208k/208k [00:00<00:00, 207MB/s]
calculate data/few_shot/resume/test.json etag: 100%|██████████| 230k/230k [00:00<00:00, 215MB/s]
calculate data/few_shot/resume/labels.txt etag: 100%|██████████| 181/181 [00:00<00:00, 357kB/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.94      0.98      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.91      0.93      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       0.88      1.00      0.94        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.93      0.95      0.94      1497

kwargs parser: {
    "batch_size": 8,
    "eval_batch_size": 64,
    "test_batch_size": 16,
    "word_embedding_file": "data/tencent/word_embedding.txt",
    "word_vocab_file": "data/tencent/tencent_vocab.txt",
    "train_file": "data/few_shot/resume/train_1350.json",
    "eval_file": "data/few_shot/resume/dev.json",
    "test_file": "data/few_sho


count line size data/few_shot/resume/labels.txt: 29L [00:00, 197780.19L/s]
build line mapper: 29L [00:00, 250793.44L/s] [00:00<?, ?it/s]
load vocab from files: 100%|██████████| 29/29 [00:00<00:00, 8732.49it/s]
load vocab from list: 100%|██████████| 28/28 [00:00<00:00, 275036.33it/s]
load dataset from data/few_shot/resume/train_1350.json: 92it [00:00, 917.12it/s]

load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/matched_words
load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/word_vocab
load cached ./temp/67aae1402c328e13a97f12024469cc97_578a629df36736a7b0ca315689a0fbc2_a783a23408031aaf8881013b1b168597_61206f767c93b652c614f8099bc479e7/1000000/vocab_embedding


load dataset from data/few_shot/resume/train_1350.json: 1350it [00:01, 797.73it/s]
load dataset from data/few_shot/resume/dev.json: 463it [00:00, 833.50it/s]
Some weights of the model checkpoint at save_pretrained/resume_pretrain_lebert_1350_pretraind_task/Bert_1290/pytorch_model.bin were not used when initializing LEBertModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing LEBertModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing LEBertModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification m

Load pretrained embedding from file.........


Epoch: 1/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.81it/s, F1=0.383, train_acc=0.675, train_loss=40.1, train_precision=0.352, train_recall=0.425]       


train_reports:
              precision    recall  f1-score   support

        CONT       0.11      0.14      0.12        86
         EDU       0.64      0.36      0.46       263
         LOC       0.00      0.00      0.00        22
        NAME       0.06      0.11      0.08       347
         ORG       0.50      0.49      0.50      1591
         PRO       0.27      0.15      0.19        86
        RACE       0.00      0.00      0.00        45
       TITLE       0.40      0.46      0.42      2111

   micro avg       0.37      0.42      0.39      4551
   macro avg       0.25      0.21      0.22      4551
weighted avg       0.41      0.42      0.41      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.853, eval_acc=0.95, eval_loss=5.93, eval_precision=0.797, eval_recall=0.919] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.89      0.97      0.93        33
         EDU       0.82      0.90      0.86       106
         LOC       0.50      0.50      0.50         2
        NAME       0.96      0.99      0.98       110
         ORG       0.75      0.89      0.81       523
         PRO       0.34      0.61      0.44        18
        RACE       0.93      0.93      0.93        15
       TITLE       0.79      0.93      0.86       690

   micro avg       0.78      0.92      0.84      1497
   macro avg       0.75      0.84      0.79      1497
weighted avg       0.79      0.92      0.85      1497



Epoch: 2/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.71it/s, F1=0.874, train_acc=0.966, train_loss=4.61, train_precision=0.841, train_recall=0.912]


train_reports:
              precision    recall  f1-score   support

        CONT       0.90      0.97      0.93        86
         EDU       0.94      0.96      0.95       263
         LOC       0.16      0.14      0.15        22
        NAME       0.98      0.98      0.98       347
         ORG       0.79      0.90      0.84      1591
         PRO       0.47      0.64      0.54        86
        RACE       0.85      0.87      0.86        45
       TITLE       0.85      0.92      0.88      2111

   micro avg       0.83      0.91      0.87      4551
   macro avg       0.74      0.80      0.77      4551
weighted avg       0.83      0.91      0.87      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.37it/s, F1=0.909, eval_acc=0.97, eval_loss=3.42, eval_precision=0.874, eval_recall=0.948] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.82      0.92      0.86       523
         PRO       0.86      1.00      0.92        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.86      0.94      0.90       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.92      0.98      0.95      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 3/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.937, train_acc=0.982, train_loss=2.25, train_precision=0.919, train_recall=0.958]


train_reports:
              precision    recall  f1-score   support

        CONT       0.94      0.97      0.95        86
         EDU       0.95      0.98      0.97       263
         LOC       0.60      0.68      0.64        22
        NAME       0.98      0.99      0.99       347
         ORG       0.89      0.94      0.92      1591
         PRO       0.81      0.93      0.86        86
        RACE       0.86      0.93      0.89        45
       TITLE       0.92      0.96      0.94      2111

   micro avg       0.91      0.96      0.93      4551
   macro avg       0.87      0.92      0.90      4551
weighted avg       0.91      0.96      0.93      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.931, eval_acc=0.967, eval_loss=3.87, eval_precision=0.909, eval_recall=0.955]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.88      0.95      0.91       690

   micro avg       0.90      0.95      0.93      1497
   macro avg       0.93      0.99      0.96      1497
weighted avg       0.90      0.95      0.93      1497



Epoch: 4/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.75it/s, F1=0.951, train_acc=0.987, train_loss=1.64, train_precision=0.938, train_recall=0.965]


train_reports:
              precision    recall  f1-score   support

        CONT       0.98      0.99      0.98        86
         EDU       0.99      0.98      0.98       263
         LOC       0.59      0.73      0.65        22
        NAME       0.98      0.99      0.99       347
         ORG       0.93      0.96      0.94      1591
         PRO       0.89      0.94      0.92        86
        RACE       0.87      0.91      0.89        45
       TITLE       0.94      0.97      0.95      2111

   micro avg       0.94      0.97      0.95      4551
   macro avg       0.90      0.93      0.91      4551
weighted avg       0.94      0.97      0.95      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.16it/s, F1=0.927, eval_acc=0.966, eval_loss=4.38, eval_precision=0.906, eval_recall=0.949]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.94      0.90       523
         PRO       0.77      0.94      0.85        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.90      0.95      0.92      1497
   macro avg       0.89      0.97      0.92      1497
weighted avg       0.90      0.95      0.92      1497



Epoch: 5/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.965, train_acc=0.992, train_loss=1, train_precision=0.954, train_recall=0.976]    


train_reports:
              precision    recall  f1-score   support

        CONT       0.98      0.99      0.98        86
         EDU       0.99      0.99      0.99       263
         LOC       0.79      0.86      0.83        22
        NAME       0.99      1.00      1.00       347
         ORG       0.94      0.97      0.96      1591
         PRO       0.93      0.97      0.95        86
        RACE       0.85      0.91      0.88        45
       TITLE       0.95      0.98      0.97      2111

   micro avg       0.95      0.98      0.97      4551
   macro avg       0.93      0.96      0.94      4551
weighted avg       0.95      0.98      0.97      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.55it/s, F1=0.906, eval_acc=0.962, eval_loss=4.57, eval_precision=0.871, eval_recall=0.945]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.97      1.00      0.99       110
         ORG       0.82      0.94      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.85      0.92      0.89       690

   micro avg       0.86      0.94      0.90      1497
   macro avg       0.88      0.98      0.92      1497
weighted avg       0.86      0.94      0.90      1497



Epoch: 6/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.982, train_acc=0.996, train_loss=0.587, train_precision=0.977, train_recall=0.987]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      0.99      0.99        86
         EDU       1.00      1.00      1.00       263
         LOC       0.84      0.95      0.89        22
        NAME       0.99      1.00      1.00       347
         ORG       0.97      0.98      0.98      1591
         PRO       0.97      0.99      0.98        86
        RACE       0.93      0.96      0.95        45
       TITLE       0.97      0.99      0.98      2111

   micro avg       0.98      0.99      0.98      4551
   macro avg       0.96      0.98      0.97      4551
weighted avg       0.98      0.99      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.52it/s, F1=0.929, eval_acc=0.969, eval_loss=3.94, eval_precision=0.91, eval_recall=0.948] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.92      0.93      0.92       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.94      0.98      0.95      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 7/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.76it/s, F1=0.989, train_acc=0.997, train_loss=0.326, train_precision=0.986, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      0.99      0.99       347
         ORG       0.98      0.99      0.98      1591
         PRO       1.00      1.00      1.00        86
        RACE       0.91      0.96      0.93        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.98      0.99      0.99      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.935, eval_acc=0.972, eval_loss=4.63, eval_precision=0.923, eval_recall=0.947]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      0.97      0.97        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      0.99      0.99       110
         ORG       0.89      0.92      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 8/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.56it/s, F1=0.98, train_acc=0.996, train_loss=0.5, train_precision=0.975, train_recall=0.986]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.96      0.98      0.97      1591
         PRO       0.95      0.98      0.97        86
        RACE       0.96      0.98      0.97        45
       TITLE       0.98      0.99      0.98      2111

   micro avg       0.98      0.99      0.98      4551
   macro avg       0.98      0.98      0.98      4551
weighted avg       0.98      0.99      0.98      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.92, eval_acc=0.967, eval_loss=5.39, eval_precision=0.904, eval_recall=0.936] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.86      0.93      0.89       523
         PRO       0.78      1.00      0.88        18
        RACE       0.94      1.00      0.97        15
       TITLE       0.90      0.91      0.91       690

   micro avg       0.90      0.93      0.91      1497
   macro avg       0.88      0.98      0.92      1497
weighted avg       0.90      0.93      0.91      1497



Epoch: 9/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.986, train_acc=0.997, train_loss=0.542, train_precision=0.983, train_recall=0.989]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.98      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      0.98      0.99        45
       TITLE       0.98      0.99      0.99      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.59it/s, F1=0.9, eval_acc=0.963, eval_loss=5.76, eval_precision=0.871, eval_recall=0.932]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      0.99      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.82      0.93      0.87       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.85      0.90      0.88       690

   micro avg       0.86      0.93      0.89      1497
   macro avg       0.88      0.97      0.92      1497
weighted avg       0.86      0.93      0.89      1497



Epoch: 10/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.69it/s, F1=0.985, train_acc=0.998, train_loss=0.357, train_precision=0.98, train_recall=0.991] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      1.00      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      0.99      1.00       347
         ORG       0.97      0.99      0.98      1591
         PRO       0.99      0.99      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.98      0.99      0.98      2111

   micro avg       0.98      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.98      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.70it/s, F1=0.928, eval_acc=0.967, eval_loss=5.5, eval_precision=0.91, eval_recall=0.946]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.94      0.93      1497



Epoch: 11/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.56it/s, F1=0.99, train_acc=0.998, train_loss=0.299, train_precision=0.988, train_recall=0.992] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.99      1591
         PRO       0.99      0.99      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.931, eval_acc=0.97, eval_loss=4.31, eval_precision=0.918, eval_recall=0.945] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      0.98      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.92      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.94      0.93       690

   micro avg       0.91      0.94      0.93      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.91      0.94      0.93      1497



Epoch: 12/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.76it/s, F1=0.992, train_acc=0.998, train_loss=0.283, train_precision=0.989, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.93      0.97      0.95        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.924, eval_acc=0.967, eval_loss=4.89, eval_precision=0.903, eval_recall=0.946]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.93      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.93      0.91       690

   micro avg       0.90      0.94      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.90      0.94      0.92      1497



Epoch: 13/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.52it/s, F1=0.994, train_acc=0.999, train_loss=0.193, train_precision=0.993, train_recall=0.996]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.97      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.56it/s, F1=0.933, eval_acc=0.971, eval_loss=4.35, eval_precision=0.922, eval_recall=0.945]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.98      0.96      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.91      0.90       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      0.93      0.97        15
       TITLE       0.92      0.95      0.93       690

   micro avg       0.92      0.94      0.93      1497
   macro avg       0.90      0.97      0.92      1497
weighted avg       0.92      0.94      0.93      1497



Epoch: 14/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.996, train_acc=0.999, train_loss=0.152, train_precision=0.995, train_recall=0.997] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      0.99      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      1.00      2111

   micro avg       0.99      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.57it/s, F1=0.939, eval_acc=0.97, eval_loss=5.17, eval_precision=0.924, eval_recall=0.954] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.97      0.96       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.89      0.93      0.91       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 15/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.52it/s, F1=0.997, train_acc=0.999, train_loss=0.123, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.23it/s, F1=0.947, eval_acc=0.974, eval_loss=4.5, eval_precision=0.935, eval_recall=0.959] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.96      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      0.99      0.99       110
         ORG       0.91      0.94      0.93       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.93      0.96      0.94      1497
   macro avg       0.91      0.98      0.94      1497
weighted avg       0.93      0.96      0.95      1497



Epoch: 16/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.999, train_acc=1, train_loss=0.0359, train_precision=0.999, train_recall=0.999]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      1.00      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.939, eval_acc=0.97, eval_loss=5.34, eval_precision=0.928, eval_recall=0.951] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.97      1.00      0.99       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.92      0.91       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 17/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=1, train_acc=1, train_loss=0.0179, train_precision=0.999, train_recall=1]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.943, eval_acc=0.972, eval_loss=5.18, eval_precision=0.93, eval_recall=0.955] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.90      0.93      0.92       523
         PRO       0.78      1.00      0.88        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.95      0.99      0.96      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 18/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.52it/s, F1=0.997, train_acc=0.999, train_loss=0.149, train_precision=0.996, train_recall=0.998]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.63it/s, F1=0.928, eval_acc=0.966, eval_loss=6.8, eval_precision=0.911, eval_recall=0.946] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      0.96      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.99      1.00      1.00       110
         ORG       0.88      0.92      0.90       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.94      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 19/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.995, train_acc=0.999, train_loss=0.182, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.942, eval_acc=0.972, eval_loss=5.58, eval_precision=0.929, eval_recall=0.956]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.99      1.00      1.00       110
         ORG       0.89      0.94      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 20/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.77it/s, F1=0.992, train_acc=0.997, train_loss=0.498, train_precision=0.989, train_recall=0.995]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      1.00      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:04<00:00,  1.79it/s, F1=0.919, eval_acc=0.969, eval_loss=5.62, eval_precision=0.904, eval_recall=0.935]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      0.92      0.94       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.91      0.89       523
         PRO       0.68      0.83      0.75        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.90      0.93      0.92       690

   micro avg       0.90      0.93      0.91      1497
   macro avg       0.92      0.95      0.94      1497
weighted avg       0.90      0.93      0.91      1497



Epoch: 21/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.99, train_acc=0.997, train_loss=0.605, train_precision=0.989, train_recall=0.993] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      0.99      0.99       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.98      0.99      0.98        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.937, eval_acc=0.97, eval_loss=4.96, eval_precision=0.924, eval_recall=0.95]  


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      0.98      0.98       110
         ORG       0.90      0.93      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.95      0.94       690

   micro avg       0.92      0.95      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.92      0.95      0.94      1497



Epoch: 22/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.75it/s, F1=0.995, train_acc=0.998, train_loss=0.258, train_precision=0.994, train_recall=0.997]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      0.99      2111

   micro avg       0.99      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.49it/s, F1=0.938, eval_acc=0.974, eval_loss=4.46, eval_precision=0.932, eval_recall=0.944]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.96      0.99      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.97      1.00      0.99       110
         ORG       0.91      0.93      0.92       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.92      0.93       690

   micro avg       0.93      0.94      0.93      1497
   macro avg       0.95      0.98      0.96      1497
weighted avg       0.93      0.94      0.93      1497



Epoch: 23/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.51it/s, F1=0.992, train_acc=0.998, train_loss=0.275, train_precision=0.99, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       0.99      1.00      0.99       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.66it/s, F1=0.938, eval_acc=0.972, eval_loss=4.87, eval_precision=0.928, eval_recall=0.948]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.92      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.93      0.95      0.94       690

   micro avg       0.92      0.95      0.93      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.92      0.95      0.93      1497



Epoch: 24/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.997, train_acc=1, train_loss=0.0656, train_precision=0.996, train_recall=0.998]    


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.68it/s, F1=0.943, eval_acc=0.972, eval_loss=5.18, eval_precision=0.932, eval_recall=0.955]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.90      0.93      0.91       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.95       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.90      0.98      0.94      1497
weighted avg       0.93      0.95      0.94      1497



Epoch: 25/30 Train: 100%|██████████| 169/169 [00:47<00:00,  3.54it/s, F1=0.998, train_acc=0.999, train_loss=0.12, train_precision=0.997, train_recall=0.998]  


train_reports:
              precision    recall  f1-score   support

        CONT       0.99      0.99      0.99        86
         EDU       0.99      1.00      0.99       263
         LOC       0.96      1.00      0.98        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.30it/s, F1=0.951, eval_acc=0.975, eval_loss=4.7, eval_precision=0.944, eval_recall=0.959] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.97      1.00      0.99        33
         EDU       0.96      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.91      0.94      0.92       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.95      0.96      0.96       690

   micro avg       0.94      0.96      0.95      1497
   macro avg       0.95      0.99      0.97      1497
weighted avg       0.94      0.96      0.95      1497



Epoch: 26/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.73it/s, F1=0.995, train_acc=0.999, train_loss=0.2, train_precision=0.994, train_recall=0.997]  


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      0.99      0.99       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      1.00      0.99      1591
         PRO       0.99      0.99      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      1.00      1.00      2111

   micro avg       0.99      1.00      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      1.00      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.58it/s, F1=0.928, eval_acc=0.967, eval_loss=6.12, eval_precision=0.916, eval_recall=0.94] 


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.92      0.90       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.92      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.89      0.98      0.93      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 27/30 Train: 100%|██████████| 169/169 [00:44<00:00,  3.76it/s, F1=0.989, train_acc=0.998, train_loss=0.396, train_precision=0.987, train_recall=0.992]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.95      0.95      0.95        22
        NAME       1.00      1.00      1.00       347
         ORG       0.98      0.99      0.99      1591
         PRO       0.99      1.00      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.98      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      0.99      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.22it/s, F1=0.929, eval_acc=0.966, eval_loss=5.71, eval_precision=0.914, eval_recall=0.945]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      1.00      0.98       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.88      0.92      0.90       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.91      0.93      0.92       690

   micro avg       0.91      0.94      0.92      1497
   macro avg       0.90      0.98      0.93      1497
weighted avg       0.91      0.94      0.92      1497



Epoch: 28/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.47it/s, F1=0.992, train_acc=0.999, train_loss=0.265, train_precision=0.991, train_recall=0.994]


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       1.00      1.00      1.00       263
         LOC       0.92      1.00      0.96        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       0.99      0.99      0.99        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       0.99      1.00      0.99      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.64it/s, F1=0.912, eval_acc=0.965, eval_loss=4.94, eval_precision=0.893, eval_recall=0.932]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       0.94      0.97      0.96        33
         EDU       0.95      0.99      0.97       106
         LOC       0.67      1.00      0.80         2
        NAME       0.98      1.00      0.99       110
         ORG       0.84      0.91      0.88       523
         PRO       0.82      1.00      0.90        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.89      0.91      0.90       690

   micro avg       0.88      0.93      0.91      1497
   macro avg       0.89      0.97      0.92      1497
weighted avg       0.89      0.93      0.91      1497



Epoch: 29/30 Train: 100%|██████████| 169/169 [00:45<00:00,  3.74it/s, F1=0.992, train_acc=0.998, train_loss=0.338, train_precision=0.99, train_recall=0.994] 


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.99      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       0.99      0.99      0.99      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       0.99      0.99      0.99      2111

   micro avg       0.99      0.99      0.99      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       0.99      0.99      0.99      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.47it/s, F1=0.931, eval_acc=0.967, eval_loss=5.73, eval_precision=0.913, eval_recall=0.949]


eval_reports:


  0%|          | 0/169 [00:00<?, ?it/s]

              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.91      1.00      0.95       106
         LOC       1.00      1.00      1.00         2
        NAME       0.98      1.00      0.99       110
         ORG       0.87      0.92      0.89       523
         PRO       0.86      1.00      0.92        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.92      0.95      0.93       690

   micro avg       0.91      0.95      0.93      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.91      0.95      0.93      1497



Epoch: 30/30 Train: 100%|██████████| 169/169 [00:48<00:00,  3.51it/s, F1=0.999, train_acc=1, train_loss=0.0849, train_precision=0.999, train_recall=0.999]   


train_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        86
         EDU       0.98      0.99      0.99       263
         LOC       1.00      1.00      1.00        22
        NAME       1.00      1.00      1.00       347
         ORG       1.00      1.00      1.00      1591
         PRO       1.00      1.00      1.00        86
        RACE       1.00      1.00      1.00        45
       TITLE       1.00      1.00      1.00      2111

   micro avg       1.00      1.00      1.00      4551
   macro avg       1.00      1.00      1.00      4551
weighted avg       1.00      1.00      1.00      4551



Eval Result: 100%|██████████| 8/8 [00:01<00:00,  4.65it/s, F1=0.942, eval_acc=0.972, eval_loss=5.02, eval_precision=0.931, eval_recall=0.954]


eval_reports:
              precision    recall  f1-score   support

        CONT       1.00      1.00      1.00        33
         EDU       0.95      1.00      0.98       106
         LOC       1.00      1.00      1.00         2
        NAME       0.96      1.00      0.98       110
         ORG       0.90      0.93      0.92       523
         PRO       0.77      0.94      0.85        18
        RACE       1.00      1.00      1.00        15
       TITLE       0.94      0.95      0.94       690

   micro avg       0.93      0.95      0.94      1497
   macro avg       0.94      0.98      0.96      1497
weighted avg       0.93      0.95      0.94      1497

