In [1]:
import os

os.environ['CUDA_DEVICE_ORDER'] = "PCI_BUS_ID"
os.environ["CUDA_VISIBLE_DEVICES"] = "0"
#os.environ["CUDA_LAUNCH_BLOCKING"] = '1'
os.environ['WANDB_DISABLED'] = 'True'

In [3]:
import torch
import re
import random
from transformers import ElectraForTokenClassification, AutoConfig, AutoTokenizer
from transformers import AdamW
import pandas as pd
from torch.utils.data import Dataset as DS
from datasets import Dataset
from transformers import DefaultDataCollator
from transformers import Trainer, TrainingArguments
from seqeval.metrics import classification_report
from sklearn.metrics import f1_score
import numpy as np
from datasets import load_metric
import wandb

In [4]:
from seqeval.scheme import IOB1, IOB2, IOE1, IOE2, IOBES, BILOU, Entities, Prefix, Tag
from seqeval.scheme import IOBES

In [5]:
permutations = [['ORG', 'PER', 'CVL', 'DAT', 'LOC', 'QNT'],
               ['DAT', 'QNT', 'PER', 'LOC', 'ORG', 'CVL'],
               ['CVL', 'LOC', 'ORG', 'QNT', 'DAT', 'PER'],
               ['QNT', 'ORG', 'DAT', 'PER', 'CVL', 'LOC'],
               ['LOC', 'CVL', 'QNT', 'ORG', 'PER', 'DAT'],
               ['PER', 'DAT', 'LOC', 'CVL', 'QNT', 'ORG']]

In [6]:
class NERDataset(DS):
    def __init__(self, dataset, tokenizer, label2id, max_length):
        super().__init__()
        self.tokenizer = tokenizer
        self.label2id = label2id
        self.max_length = max_length
        self.dataset = dataset
        self.data = []
        
        for i in range(len(self.dataset['label'])):
            text = dataset['label'][i]
            tagged_words = re.findall('<.*?:.*?>', text)
            
            word2ids = dict()
            for tagged_word in tagged_words:
                tag_splited = tagged_word.strip('<>').split(':')
                tag = tag_splited[-1]
                word = ':'.join(tag_splited[:-1])
                    
                word_tok = self.tokenizer.encode(word)[1:-1]
                if word not in word2ids:

                    label_id = [self.label2id['B-'+tag]]
                    if len(word_tok) > 1 :
                        label_id.extend([self.label2id['I-'+tag]] * (len(word_tok)-1))
                    word2ids[word] = {
                        'target_ids': word_tok,
                        'label_id': label_id 
                    }
                    text = text.replace(tagged_word, word)

            tokenized = self.tokenizer(text, truncation=True, max_length=self.max_length, padding='max_length')
            if 0 in tokenized['input_ids']:
                tok_length = tokenized['input_ids'].index(0)
            else:
                tok_length = self.max_length
            label_input = tokenized['input_ids'][:tok_length]
            labels = self._gen_labels(label_input, word2ids)
            labels.insert(0, -100)
            pad = [-100] * (self.max_length - len(labels))
            labels.extend(pad)

            temp = {
                'input_ids' : tokenized['input_ids'],
                'attention_mask' : tokenized['attention_mask'],
                'labels' : labels
            }
            
            self.data.append(temp)
        
    def _gen_labels(self, input_ids, word2ids):
        sequence = input_ids[1:-1]
        labels = [0] * len(sequence)
        
        for v in word2ids.values():
            target_ids = v['target_ids']
            label_id = v['label_id']
            
            i=0
            target_ids_length = len(target_ids)
            
            while i < len(sequence):
                if sequence[i:i + target_ids_length] == target_ids:
                    labels[i:i + target_ids_length] = label_id
                    i = i + target_ids_length
                else:
                    i += 1
                    
        return labels
    
    def __len__(self):
        return len(self.data)
    
    def __getitem__(self, idx):
        return {
            'input_ids': self.data[idx]['input_ids'],
            'attention_mask': self.data[idx]['attention_mask'],
            'labels': self.data[idx]['labels'],
        }

In [7]:
class IOBE(IOBES):
    allowed_prefix = Prefix.I | Prefix.O | Prefix.B | Prefix.E
    start_patterns = {
        (Prefix.ANY, Prefix.B, Tag.ANY),
        (Prefix.ANY, Prefix.S, Tag.ANY)
    }
    inside_patterns = {
        (Prefix.B, Prefix.I, Tag.SAME),
        (Prefix.B, Prefix.E, Tag.SAME),
        (Prefix.I, Prefix.I, Tag.SAME),
        (Prefix.I, Prefix.E, Tag.SAME)
    }
    end_patterns = {
        (Prefix.S, Prefix.ANY, Tag.ANY),
        (Prefix.E, Prefix.ANY, Tag.ANY),
        (Prefix.B, Prefix.O, Tag.ANY),
        (Prefix.B, Prefix.I, Tag.DIFF),
        (Prefix.B, Prefix.B, Tag.ANY),
    }

In [8]:
def compute_metrics(eval_pred):
    logits, labels = eval_pred
    predictions = np.argmax(logits, axis=-1)
    #import pdb;pdb.set_trace()
    predictions = predictions.flatten()
    labels = labels.flatten()
    npre = []
    nlab = []
 
    for i in range(len(labels)):
        if labels[i] != -100:
            npre.append(predictions[i])
            nlab.append(labels[i])
    npre = torch.tensor(npre)
    nlab = torch.tensor(nlab)
    
    label_indices = label_arr.copy()
    npre = [label_indices[pred] for pred in npre]
    nlab = [label_indices[label] for label in nlab]
    del label_indices[label_indices.index("O")]
    entity_level_metrics = classification_report(
        [nlab], [npre], digits=3,
        suffix=False,
        mode= 'strict', scheme=IOBE, 
        zero_division=True, output_dict=True
    )

    metrics = {}
    
    for key in entity_level_metrics.keys():
        if len(key) == 3:
            metrics[key+"_f1"] = entity_level_metrics[key]['f1-score']
            metrics[key+"_recall"] = entity_level_metrics[key]['recall']
            metrics[key+"_precision"] = entity_level_metrics[key]['precision']
            
        if key == 'macro avg':
            metrics["entity_macro_f1"] = entity_level_metrics['macro avg']['f1-score']
            metrics["entity_macro_precision"] = entity_level_metrics['macro avg']['precision']
            metrics["entity_macro_recall"] = entity_level_metrics['macro avg']['recall']
            
    return metrics

In [9]:
def base_train(config):
    
    model = ElectraForTokenClassification.from_pretrained(config['base_model_dir'], num_labels=(config['step']*2+1))
    tokenizer = AutoTokenizer.from_pretrained(config['base_model_dir'])
    train_file = pd.read_csv(config['train_file'])
    valid_file = pd.read_csv(config['valid_file'], sep='\t') 
    
    label2id = {'O':0}
    count = 1
    for i in range(config['step']):
        label2id['B-'+permutations[config['perm']][i]] = count
        count += 1
        label2id['I-'+permutations[config['perm']][i]] = count
        count += 1

    train_data = NERDataset(train_file, tokenizer=tokenizer, max_length=300, label2id=label2id)
    valid_data = NERDataset(valid_file, tokenizer=tokenizer, max_length=300, label2id=label2id)
    id2label = {label2id[label] : label for label in label2id.keys()}
    
    #import pdb;pdb.set_trace()
    
    model.config.label2id = label2id
    model.config.id2label = id2label

    global label_arr
    
    label_arr = []
    for v in id2label.values():
        label_arr.append(v)
        

    data_collator = DefaultDataCollator()
    device = torch.device("cuda")
    model.to(device)
     
    training_args = TrainingArguments(

        output_dir=config['output_dir'],
        do_eval = True,
        learning_rate=config['learning_rate'],
        per_device_train_batch_size=16,
        per_device_eval_batch_size=16,
        num_train_epochs=config['train_epoch'],
        weight_decay=0.1,
        save_strategy = 'epoch',
        logging_strategy = 'epoch',
        evaluation_strategy = 'epoch',
        load_best_model_at_end = True,
        label_names = ['labels'],
        metric_for_best_model = 'entity_macro_f1',
        warmup_ratio = 0.05,
        no_cuda = False
    )

    trainer = Trainer(
        model=model,
        args=training_args,
        train_dataset=train_data,
        eval_dataset = valid_data,
        data_collator=data_collator,
        tokenizer = tokenizer,
        compute_metrics=compute_metrics
    )

    trainer.train()
    trainer.save_model(config['output_dir'] + '/final')
    
    for f_name in os.listdir(config['output_dir']):
        if f_name.startswith('checkpoint'):
            for f in os.listdir(config['output_dir']+'/'+f_name):
                os.remove(config['output_dir']+'/'+f_name+'/'+f)
            os.rmdir(config['output_dir']+'/'+f_name)



In [10]:
def test(config):
    
    model = ElectraForTokenClassification.from_pretrained(config['model'])
    
    global label_arr
    
    label_arr = []
    for v in model.config.id2label.values():
        label_arr.append(v)
    
    tokenizer = AutoTokenizer.from_pretrained(config['model'])
    
    test_file = pd.read_csv(config['test_file'], sep='\t')
    label2id = model.config.label2id
    
    test_dataset = NERDataset(test_file, tokenizer=tokenizer, max_length=300, label2id=label2id)
    
    device = torch.device("cuda")
    model.to(device)
    
    data_collator = DefaultDataCollator()
    
    training_args = TrainingArguments(
        output_dir=config['model'],
        per_device_eval_batch_size=32,
    )

    trainer = Trainer(
        args=training_args,
        model=model,
        data_collator=data_collator,
        compute_metrics=compute_metrics
    )
    
    metrics = trainer.evaluate(test_dataset)
    trainer.save_metrics(split='test', metrics=metrics)
    

In [11]:
import os

if(__name__=="__main__"):
    
    for per_num_int in range(1,7):
        per_num = str(per_num_int)
        permutation_dir = "full_cl_data/perm_" + per_num

        data_file_dict = {
            "train" : [],
            "valid" : []
        }

        for i in range(6):
            for f_name in os.listdir(permutation_dir + '/'):
                if f_name.startswith('step'+str(i+1)):
                    data_file_dict['train'].append(f_name)
                    break

            for f_name in os.listdir('test_data/perm' + str(per_num)):
                if f_name.startswith('eval_'+str(i+1)):
                    data_file_dict['valid'].append(f_name)
                    break

        for i in range(6):

            base_config = {
                'base_model_dir' : 'monologg/koelectra-base-v3-discriminator',
                'train_file' : permutation_dir + '/' + data_file_dict['train'][i],
                'valid_file' : 'test_data/perm' + str(per_num) + '/' + data_file_dict['valid'][i],
                'output_dir' : 'full_cl_result/perm_' + per_num + '/step' + str(i+1),
                'train_epoch' : 10,
                'learning_rate' : 5e-05,
                'step' : i+1,
                'perm': per_num_int-1
            }

            base_train(base_config)
            
            test_config = {
                'model':'full_cl_result/perm_' + per_num + '/step' + str(i+1) + '/final',
                'test_file': 'test_data/perm' + str(per_num) + '/' + data_file_dict['valid'][i]
            }    

            test(test_config)

Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Org F1,Org Recall,Org Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1679,0.034776,0.836759,0.880407,0.797235,0.836759,0.797235,0.880407
2,0.029,0.0355,0.847015,0.866412,0.828467,0.847015,0.828467,0.866412
3,0.013,0.039711,0.859223,0.900763,0.821346,0.859223,0.821346,0.900763
4,0.0059,0.041336,0.840713,0.930025,0.767051,0.840713,0.767051,0.930025
5,0.0042,0.044613,0.857823,0.917303,0.805587,0.857823,0.805587,0.917303
6,0.0021,0.050226,0.856803,0.917303,0.80379,0.856803,0.80379,0.917303
7,0.001,0.058443,0.847813,0.924936,0.782562,0.847813,0.782562,0.924936
8,0.0022,0.056253,0.859044,0.903308,0.818916,0.859044,0.818916,0.903308
9,0.0009,0.056773,0.858338,0.913486,0.80947,0.858338,0.80947,0.913486
10,0.0005,0.057455,0.85697,0.899491,0.818287,0.85697,0.818287,0.899491


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2152,0.046796,0.845481,0.922392,0.780409,0.940805,0.934169,0.947536,0.893143,0.863972,0.928281
2,0.0343,0.043017,0.841153,0.946565,0.756867,0.940632,0.956113,0.925645,0.890893,0.841256,0.951339
3,0.0178,0.044112,0.855991,0.945293,0.782105,0.94081,0.946708,0.934985,0.8984,0.858545,0.946001
4,0.0105,0.052833,0.862582,0.922392,0.810056,0.941543,0.946708,0.936434,0.902063,0.873245,0.93455
5,0.0056,0.056466,0.866066,0.917303,0.82025,0.946792,0.948276,0.945312,0.906429,0.882781,0.932789
6,0.0041,0.061635,0.865056,0.933842,0.805708,0.938329,0.942006,0.934681,0.901693,0.870195,0.937924
7,0.0023,0.062923,0.86967,0.92112,0.823663,0.946625,0.945141,0.948113,0.908147,0.885888,0.93313
8,0.0017,0.068903,0.865636,0.926209,0.8125,0.943962,0.937304,0.950715,0.904799,0.881608,0.931756
9,0.0011,0.073491,0.868923,0.898219,0.841478,0.944708,0.937304,0.952229,0.906815,0.896854,0.917761
10,0.0008,0.07311,0.869565,0.903308,0.838253,0.947785,0.938871,0.956869,0.908675,0.897561,0.92109


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2834,0.078659,0.890068,0.862601,0.919342,0.865562,0.898089,0.835308,0.929183,0.935737,0.92272,0.894938,0.892457,0.898809
2,0.0572,0.067088,0.902828,0.914769,0.891195,0.872044,0.915924,0.832176,0.932308,0.949843,0.915408,0.902393,0.879593,0.926845
3,0.0319,0.073267,0.906114,0.914769,0.897621,0.883005,0.913376,0.854589,0.942924,0.945141,0.940718,0.910681,0.897642,0.924428
4,0.0197,0.087601,0.907002,0.927994,0.886938,0.879134,0.93121,0.832574,0.944138,0.940439,0.947867,0.910091,0.889127,0.933214
5,0.0108,0.090665,0.915193,0.931668,0.899291,0.880633,0.921019,0.843641,0.944314,0.943574,0.945055,0.91338,0.895995,0.932087
6,0.0066,0.096063,0.914683,0.917708,0.911679,0.871046,0.912102,0.833527,0.940252,0.937304,0.943218,0.90866,0.896141,0.922371
7,0.0041,0.105714,0.915267,0.900808,0.930197,0.873325,0.913376,0.836639,0.947286,0.943574,0.951027,0.911959,0.905955,0.919253
8,0.0027,0.111894,0.914286,0.928729,0.900285,0.882026,0.909554,0.856115,0.948617,0.940439,0.956938,0.914976,0.904446,0.926241
9,0.0016,0.118014,0.914817,0.939015,0.891835,0.877064,0.913376,0.843529,0.940805,0.934169,0.947536,0.910896,0.8943,0.928854
10,0.0013,0.118524,0.918345,0.921381,0.915328,0.879511,0.915924,0.845882,0.944444,0.932602,0.956592,0.9141,0.905934,0.923302


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2956,0.083158,0.90876,0.918442,0.899281,0.885845,0.889908,0.881818,0.866831,0.895541,0.839904,0.943838,0.948276,0.939441,0.901319,0.890111,0.913042
2,0.0637,0.073771,0.911658,0.925055,0.898644,0.892308,0.88685,0.897833,0.882917,0.878981,0.886889,0.947702,0.937304,0.958333,0.908646,0.910425,0.907048
3,0.0372,0.075074,0.906429,0.932403,0.881862,0.890282,0.868502,0.913183,0.874172,0.924841,0.828767,0.952756,0.948276,0.957278,0.90591,0.895273,0.918505
4,0.0221,0.088707,0.910206,0.927259,0.893768,0.904401,0.911315,0.89759,0.860981,0.938854,0.795038,0.950558,0.934169,0.967532,0.906536,0.888482,0.927899
5,0.0135,0.102602,0.909289,0.920647,0.898208,0.847458,0.917431,0.787402,0.838638,0.956688,0.746521,0.946783,0.934169,0.959742,0.885542,0.847968,0.932234
6,0.0082,0.110689,0.906903,0.94122,0.875,0.912711,0.911315,0.91411,0.88543,0.905732,0.866017,0.948535,0.938871,0.9584,0.913395,0.903382,0.924285
7,0.0055,0.123889,0.92053,0.919177,0.921887,0.892638,0.889908,0.895385,0.886839,0.918471,0.857313,0.94081,0.946708,0.934985,0.910204,0.902392,0.918566
8,0.0038,0.12204,0.911302,0.936076,0.887805,0.906344,0.917431,0.895522,0.887255,0.922293,0.854782,0.946288,0.938871,0.953822,0.912797,0.897983,0.928668
9,0.0025,0.127877,0.9196,0.91183,0.927504,0.901235,0.892966,0.909657,0.879758,0.927389,0.836782,0.948031,0.943574,0.952532,0.912156,0.906619,0.91894
10,0.0015,0.132231,0.920205,0.923586,0.916849,0.905426,0.892966,0.918239,0.886585,0.926115,0.850292,0.950355,0.945141,0.955626,0.915643,0.910252,0.921952


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3062,0.091052,0.900634,0.939706,0.864682,0.899696,0.905199,0.89426,0.887189,0.904483,0.870544,0.871287,0.901408,0.843114,0.931978,0.934169,0.929797,0.898157,0.880479,0.916993
2,0.0727,0.079296,0.920727,0.930882,0.910791,0.889908,0.889908,0.889908,0.899065,0.889864,0.908458,0.888055,0.909091,0.867971,0.947451,0.946708,0.948195,0.909041,0.905065,0.913291
3,0.0431,0.097354,0.919199,0.911765,0.926756,0.907692,0.902141,0.913313,0.893932,0.883041,0.905095,0.879467,0.929577,0.834483,0.950794,0.938871,0.963023,0.910217,0.908534,0.913079
4,0.0264,0.097402,0.912318,0.944853,0.881949,0.905426,0.892966,0.918239,0.912518,0.920078,0.905081,0.886294,0.923175,0.852246,0.95444,0.968652,0.940639,0.914199,0.899631,0.929945
5,0.016,0.105638,0.920118,0.914706,0.925595,0.923547,0.923547,0.923547,0.904597,0.891813,0.917753,0.879511,0.920615,0.84192,0.945882,0.945141,0.946625,0.914731,0.911088,0.919164
6,0.0107,0.11435,0.921852,0.936765,0.907407,0.898678,0.93578,0.864407,0.915172,0.920078,0.910318,0.893316,0.889885,0.896774,0.938136,0.938871,0.937402,0.913431,0.903262,0.924276
7,0.0069,0.132353,0.920393,0.930882,0.910137,0.919753,0.911315,0.928349,0.908468,0.904483,0.912488,0.882139,0.929577,0.839306,0.947368,0.945141,0.949606,0.915624,0.907977,0.92428
8,0.0043,0.134261,0.91925,0.9375,0.901697,0.917574,0.902141,0.933544,0.910256,0.89961,0.921158,0.879951,0.924456,0.839535,0.949416,0.956113,0.942813,0.91529,0.907749,0.923964
9,0.0027,0.141175,0.924198,0.932353,0.916185,0.918083,0.908257,0.928125,0.914563,0.918129,0.911025,0.888191,0.90525,0.871763,0.944882,0.940439,0.949367,0.917984,0.915293,0.920885
10,0.0019,0.144968,0.922464,0.936029,0.909286,0.910769,0.905199,0.916409,0.913641,0.907407,0.91996,0.88625,0.90781,0.86569,0.950198,0.942006,0.958533,0.916664,0.913975,0.91969


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3062,0.107368,0.920459,0.914706,0.926284,0.875723,0.926606,0.830137,0.894277,0.898635,0.889961,0.849526,0.918054,0.790518,0.943606,0.931034,0.956522,0.862745,0.897959,0.830189,0.891056,0.870602,0.914499
2,0.0814,0.093497,0.913433,0.9,0.927273,0.904239,0.880734,0.929032,0.897523,0.900585,0.894482,0.881188,0.911652,0.852695,0.93909,0.954545,0.924127,0.884354,0.884354,0.884354,0.903304,0.901994,0.905312
3,0.0497,0.091815,0.913422,0.888235,0.940078,0.929356,0.905199,0.954839,0.900534,0.904483,0.896618,0.872892,0.861716,0.884363,0.952681,0.946708,0.95873,0.882759,0.870748,0.895105,0.908607,0.921622,0.896182
4,0.0306,0.103289,0.921898,0.928676,0.915217,0.907716,0.917431,0.898204,0.910766,0.915205,0.906371,0.876308,0.911652,0.843602,0.951788,0.959248,0.944444,0.90785,0.904762,0.910959,0.912721,0.903133,0.922829
5,0.0188,0.117455,0.927774,0.916176,0.939668,0.912773,0.896024,0.930159,0.90566,0.912281,0.899135,0.881398,0.903969,0.859927,0.953507,0.948276,0.958796,0.888889,0.897959,0.88,0.911667,0.911281,0.912448
6,0.0126,0.125414,0.927167,0.936029,0.91847,0.92575,0.896024,0.957516,0.910634,0.888889,0.93347,0.873563,0.924456,0.827982,0.946457,0.942006,0.950949,0.90301,0.918367,0.888158,0.91443,0.912758,0.917629
7,0.0088,0.134512,0.922907,0.919853,0.925981,0.928349,0.911315,0.946032,0.908374,0.898635,0.918327,0.876895,0.925736,0.832949,0.956182,0.95768,0.954688,0.880259,0.92517,0.839506,0.912161,0.902914,0.923065
8,0.0054,0.142252,0.923077,0.935294,0.911175,0.922601,0.911315,0.934169,0.913952,0.916179,0.911736,0.882716,0.915493,0.852205,0.952607,0.945141,0.960191,0.888889,0.92517,0.855346,0.913974,0.904137,0.924765
9,0.0032,0.155201,0.924771,0.926471,0.923077,0.921418,0.914373,0.928571,0.909897,0.900585,0.919403,0.881919,0.918054,0.848521,0.954403,0.951411,0.957413,0.901695,0.904762,0.898649,0.915684,0.912606,0.919276
10,0.0022,0.157625,0.925899,0.927941,0.923865,0.919255,0.905199,0.933754,0.911504,0.903509,0.919643,0.884521,0.921895,0.850059,0.954331,0.949843,0.958861,0.890365,0.911565,0.87013,0.914312,0.909385,0.919992


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1703,0.021656,0.840336,0.923077,0.771208,0.840336,0.771208,0.923077
2,0.0193,0.016789,0.85037,0.883077,0.82,0.85037,0.82,0.883077
3,0.01,0.015121,0.889937,0.870769,0.909968,0.889937,0.909968,0.870769
4,0.0065,0.015085,0.874618,0.88,0.869301,0.874618,0.869301,0.88
5,0.0041,0.015765,0.880989,0.876923,0.885093,0.880989,0.885093,0.876923
6,0.002,0.016143,0.871642,0.898462,0.846377,0.871642,0.846377,0.898462
7,0.001,0.018764,0.894977,0.904615,0.885542,0.894977,0.885542,0.904615
8,0.0007,0.019627,0.887879,0.901538,0.874627,0.887879,0.874627,0.901538
9,0.0005,0.019407,0.893617,0.904615,0.882883,0.893617,0.882883,0.904615
10,0.0003,0.019525,0.893939,0.907692,0.880597,0.893939,0.880597,0.907692


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2068,0.032738,0.888179,0.855385,0.923588,0.820513,0.876712,0.771084,0.854346,0.847336,0.866048
2,0.0279,0.025583,0.888189,0.867692,0.909677,0.834951,0.883562,0.791411,0.86157,0.850544,0.875627
3,0.0176,0.029439,0.881459,0.892308,0.870871,0.86755,0.89726,0.839744,0.874504,0.855307,0.894784
4,0.0102,0.025765,0.865443,0.870769,0.860182,0.830769,0.924658,0.75419,0.848106,0.807186,0.897713
5,0.0059,0.029656,0.904239,0.886154,0.923077,0.875862,0.869863,0.881944,0.89005,0.902511,0.878008
6,0.004,0.031482,0.888889,0.873846,0.904459,0.802395,0.917808,0.712766,0.845642,0.808612,0.895827
7,0.0024,0.032849,0.902439,0.910769,0.89426,0.858065,0.910959,0.810976,0.880252,0.852618,0.910864
8,0.0017,0.035803,0.900621,0.892308,0.909091,0.854305,0.883562,0.826923,0.877463,0.868007,0.887935
9,0.001,0.035867,0.905199,0.910769,0.899696,0.872131,0.910959,0.836478,0.888665,0.868087,0.910864
10,0.0007,0.036432,0.905426,0.898462,0.9125,0.865574,0.90411,0.830189,0.8855,0.871344,0.901286


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2502,0.048329,0.793296,0.868502,0.730077,0.931783,0.944969,0.91896,0.785714,0.897959,0.698413,0.836931,0.782483,0.90381
2,0.0338,0.036807,0.886503,0.883792,0.889231,0.946625,0.948113,0.945141,0.891892,0.897959,0.885906,0.90834,0.906759,0.909955
3,0.0195,0.035762,0.900929,0.889908,0.912226,0.939815,0.957547,0.922727,0.878049,0.857143,0.9,0.906264,0.911651,0.901533
4,0.0126,0.035502,0.888889,0.892966,0.884848,0.949843,0.95283,0.946875,0.86262,0.918367,0.813253,0.900451,0.881659,0.921388
5,0.0081,0.041612,0.887147,0.865443,0.909968,0.941456,0.935535,0.947452,0.849673,0.884354,0.81761,0.892759,0.891677,0.895111
6,0.0049,0.043869,0.886762,0.850153,0.926667,0.944532,0.937107,0.952077,0.865772,0.877551,0.854305,0.899022,0.911016,0.88827
7,0.0031,0.045742,0.88785,0.87156,0.904762,0.942292,0.937107,0.947536,0.829114,0.891156,0.775148,0.886419,0.875815,0.899941
8,0.002,0.049589,0.885802,0.877676,0.894081,0.946288,0.941824,0.950794,0.85906,0.870748,0.847682,0.89705,0.897519,0.896749
9,0.0012,0.052302,0.902628,0.892966,0.9125,0.941915,0.943396,0.940439,0.86,0.877551,0.843137,0.901514,0.898692,0.904638
10,0.0009,0.053024,0.902628,0.892966,0.9125,0.943485,0.944969,0.942006,0.860841,0.904762,0.820988,0.902318,0.891831,0.914232


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2609,0.059309,0.881789,0.844037,0.923077,0.892473,0.887269,0.897738,0.934375,0.940252,0.928571,0.852349,0.863946,0.84106,0.890247,0.897612,0.883876
2,0.0432,0.04523,0.917683,0.920489,0.914894,0.913488,0.954325,0.876004,0.944615,0.965409,0.924699,0.865772,0.877551,0.854305,0.91039,0.892475,0.929443
3,0.0268,0.045802,0.907975,0.905199,0.910769,0.912594,0.943635,0.88353,0.94,0.960692,0.920181,0.841772,0.904762,0.786982,0.900585,0.875366,0.928572
4,0.0158,0.048847,0.895801,0.880734,0.911392,0.906265,0.906706,0.905825,0.952082,0.95283,0.951334,0.897959,0.897959,0.897959,0.913027,0.916628,0.909557
5,0.0102,0.053149,0.896657,0.902141,0.891239,0.914534,0.920311,0.908829,0.94647,0.959119,0.93415,0.872964,0.911565,0.8375,0.907656,0.892929,0.923284
6,0.0064,0.057239,0.903817,0.905199,0.902439,0.913126,0.939747,0.887971,0.944795,0.941824,0.947785,0.899329,0.911565,0.887417,0.915267,0.906403,0.924584
7,0.0044,0.062801,0.896445,0.88685,0.90625,0.91298,0.912536,0.913424,0.953942,0.960692,0.947287,0.893333,0.911565,0.875817,0.914175,0.910694,0.917911
8,0.0027,0.066272,0.889226,0.896024,0.88253,0.913652,0.920311,0.907088,0.957265,0.968553,0.946237,0.883721,0.904762,0.863636,0.910966,0.899873,0.922413
9,0.0016,0.068152,0.882883,0.899083,0.867257,0.91401,0.919339,0.908742,0.957614,0.959119,0.956113,0.899329,0.911565,0.887417,0.913459,0.904882,0.922276
10,0.0012,0.068691,0.896024,0.896024,0.896024,0.910939,0.91448,0.907425,0.959248,0.962264,0.95625,0.902357,0.911565,0.893333,0.917142,0.913258,0.921083


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2886,0.075605,0.8864,0.847095,0.92953,0.891828,0.919182,0.866055,0.858056,0.858056,0.858056,0.934921,0.923197,0.946945,0.861111,0.843537,0.879433,0.886463,0.896004,0.878214
2,0.06,0.069274,0.893939,0.902141,0.885886,0.901463,0.899708,0.903226,0.884639,0.91688,0.854589,0.947368,0.973354,0.922734,0.861842,0.891156,0.834395,0.89785,0.880166,0.916648
3,0.0367,0.071145,0.909938,0.896024,0.92429,0.901435,0.917235,0.886171,0.876746,0.923274,0.834682,0.951779,0.943574,0.960128,0.875817,0.911565,0.842767,0.903143,0.889608,0.918334
4,0.023,0.084812,0.903846,0.862385,0.949495,0.900971,0.903603,0.898354,0.868146,0.850384,0.886667,0.951049,0.959248,0.942989,0.865574,0.897959,0.835443,0.897917,0.90259,0.894716
5,0.0142,0.085809,0.912226,0.889908,0.935691,0.907836,0.896787,0.919162,0.882817,0.929668,0.840462,0.949922,0.951411,0.948438,0.906574,0.891156,0.922535,0.911875,0.913258,0.911786
6,0.009,0.092016,0.921418,0.914373,0.928571,0.912482,0.928919,0.896617,0.879647,0.892583,0.867081,0.946136,0.949843,0.942457,0.871287,0.897959,0.846154,0.906194,0.896176,0.916736
7,0.0058,0.101636,0.923313,0.920489,0.926154,0.912146,0.925024,0.899621,0.880653,0.896419,0.865432,0.950896,0.956113,0.945736,0.895623,0.904762,0.886667,0.912526,0.904722,0.920562
8,0.0039,0.109261,0.911901,0.902141,0.921875,0.911405,0.906524,0.916339,0.884833,0.898977,0.871128,0.958009,0.965517,0.950617,0.893333,0.911565,0.875817,0.911896,0.907155,0.916945
9,0.0023,0.112416,0.912226,0.889908,0.935691,0.912451,0.91334,0.911565,0.881463,0.893862,0.869403,0.953271,0.959248,0.947368,0.888889,0.897959,0.88,0.90966,0.908805,0.910863
10,0.0015,0.115552,0.906542,0.889908,0.92381,0.912916,0.908471,0.917404,0.884447,0.905371,0.864469,0.952978,0.952978,0.952978,0.882943,0.897959,0.868421,0.907965,0.905416,0.910938


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3049,0.101651,0.917864,0.916176,0.919557,0.905325,0.93578,0.876791,0.901544,0.910331,0.892925,0.844796,0.888604,0.805104,0.943485,0.942006,0.944969,0.83871,0.884354,0.797546,0.891954,0.872815,0.912875
2,0.0794,0.09276,0.920328,0.908824,0.932127,0.912226,0.889908,0.935691,0.902499,0.897661,0.907389,0.877724,0.928297,0.832377,0.949729,0.962382,0.937405,0.863636,0.904762,0.826087,0.904357,0.895179,0.915306
3,0.0476,0.091688,0.91853,0.891176,0.947615,0.909091,0.902141,0.916149,0.91264,0.911306,0.913978,0.875242,0.866837,0.883812,0.954617,0.956113,0.953125,0.906574,0.891156,0.922535,0.912782,0.922869,0.903122
4,0.0294,0.099772,0.918449,0.931618,0.905647,0.90184,0.899083,0.904615,0.914313,0.946394,0.884335,0.875858,0.898848,0.854015,0.947779,0.952978,0.942636,0.907216,0.897959,0.916667,0.910909,0.901319,0.921146
5,0.0184,0.110851,0.921365,0.913235,0.929641,0.903125,0.883792,0.923323,0.910318,0.920078,0.900763,0.877323,0.90653,0.84994,0.950588,0.949843,0.951334,0.876623,0.918367,0.838509,0.906557,0.898918,0.915308
6,0.0122,0.129161,0.921569,0.933088,0.91033,0.9088,0.868502,0.95302,0.903741,0.883041,0.925434,0.871549,0.929577,0.820339,0.950872,0.940439,0.961538,0.906667,0.92517,0.888889,0.910533,0.909925,0.913303
7,0.0072,0.137644,0.923869,0.923529,0.924209,0.907378,0.883792,0.932258,0.903421,0.875244,0.933472,0.87439,0.918054,0.834692,0.955364,0.956113,0.954617,0.889632,0.904762,0.875,0.909009,0.909041,0.910249
8,0.0049,0.149796,0.924309,0.933824,0.914986,0.9125,0.892966,0.932907,0.914676,0.91423,0.915122,0.882682,0.910371,0.856627,0.955224,0.952978,0.95748,0.886731,0.931973,0.845679,0.912687,0.9038,0.922724
9,0.0032,0.154463,0.926649,0.924265,0.929047,0.914729,0.902141,0.927673,0.912039,0.904483,0.919722,0.885696,0.90781,0.864634,0.954545,0.954545,0.954545,0.888889,0.897959,0.88,0.913758,0.912604,0.915201
10,0.0021,0.159601,0.927152,0.926471,0.927835,0.90881,0.899083,0.91875,0.915769,0.911306,0.920276,0.889582,0.912932,0.867397,0.956863,0.956113,0.957614,0.895623,0.904762,0.886667,0.915633,0.91309,0.918444


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1925,0.041194,0.847912,0.791176,0.913413,0.847912,0.913413,0.791176
2,0.0317,0.032082,0.891321,0.868382,0.915504,0.891321,0.915504,0.868382
3,0.0162,0.039601,0.894049,0.905882,0.882521,0.894049,0.882521,0.905882
4,0.0064,0.043602,0.891258,0.922059,0.862448,0.891258,0.862448,0.922059
5,0.0039,0.049392,0.891476,0.872794,0.910975,0.891476,0.910975,0.872794
6,0.0048,0.04803,0.893525,0.913235,0.874648,0.893525,0.874648,0.913235
7,0.0016,0.055547,0.893246,0.904412,0.882353,0.893246,0.882353,0.904412
8,0.0014,0.051044,0.897813,0.920588,0.876137,0.897813,0.876137,0.920588
9,0.001,0.054409,0.900298,0.889706,0.911145,0.900298,0.911145,0.889706
10,0.0007,0.053944,0.900628,0.896324,0.904974,0.900628,0.904974,0.896324


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2212,0.058675,0.889561,0.865342,0.915175,0.892379,0.940604,0.848858,0.89097,0.882016,0.902973
2,0.0397,0.051995,0.893633,0.862399,0.927215,0.906921,0.925024,0.889513,0.900277,0.908364,0.893712
3,0.0196,0.055129,0.915091,0.908021,0.922272,0.908345,0.969815,0.854202,0.911718,0.888237,0.938918
4,0.0106,0.059275,0.9116,0.899191,0.924357,0.902917,0.919182,0.887218,0.907259,0.905788,0.909186
5,0.0059,0.071343,0.902857,0.930096,0.877169,0.894447,0.870497,0.919753,0.898652,0.898461,0.900296
6,0.0039,0.075051,0.896991,0.932303,0.864256,0.904576,0.904576,0.904576,0.900784,0.884416,0.91844
7,0.0023,0.07886,0.910927,0.92936,0.893211,0.901024,0.899708,0.902344,0.905975,0.897777,0.914534
8,0.0015,0.081599,0.915689,0.919058,0.912345,0.900246,0.891918,0.90873,0.907967,0.910537,0.905488
9,0.0011,0.080594,0.913825,0.916851,0.910819,0.903288,0.909445,0.897214,0.908556,0.904016,0.913148
10,0.0008,0.082304,0.912996,0.922737,0.903458,0.901999,0.900682,0.90332,0.907498,0.903389,0.911709


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2795,0.084835,0.886364,0.860927,0.913349,0.887317,0.856585,0.920335,0.873171,0.916773,0.833527,0.882284,0.889071,0.878095
2,0.0565,0.074705,0.910927,0.92936,0.893211,0.891566,0.866341,0.918304,0.873868,0.927017,0.826484,0.89212,0.879333,0.907573
3,0.0306,0.081086,0.907636,0.918322,0.897196,0.891023,0.905366,0.877127,0.87396,0.941101,0.81576,0.890873,0.863361,0.921596
4,0.0182,0.092432,0.908506,0.935247,0.883252,0.905588,0.917073,0.894386,0.88,0.929577,0.835443,0.898031,0.871027,0.927299
5,0.0104,0.098267,0.920896,0.908021,0.934141,0.896447,0.861463,0.934392,0.871642,0.934699,0.816555,0.896328,0.895029,0.901394
6,0.0059,0.106498,0.908699,0.930096,0.888264,0.913652,0.923902,0.903626,0.885,0.90653,0.864469,0.90245,0.885453,0.920176
7,0.0038,0.115965,0.91385,0.924945,0.903017,0.911479,0.914146,0.908826,0.881522,0.919334,0.846698,0.902284,0.886181,0.919475
8,0.0026,0.125657,0.913819,0.905077,0.922731,0.905095,0.883902,0.927329,0.884591,0.90781,0.86253,0.901168,0.904197,0.89893
9,0.0016,0.128006,0.917371,0.919058,0.915689,0.906219,0.89561,0.917083,0.882972,0.912932,0.854916,0.902187,0.895896,0.9092
10,0.0012,0.13062,0.919778,0.915379,0.92422,0.909451,0.896585,0.922691,0.883692,0.919334,0.850711,0.904307,0.899207,0.910433


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2994,0.092692,0.903203,0.923473,0.883803,0.879664,0.92,0.842717,0.872636,0.886044,0.859627,0.808511,0.904762,0.730769,0.866003,0.829229,0.90857
2,0.0648,0.078414,0.906407,0.926416,0.887245,0.911111,0.96,0.86696,0.889325,0.869398,0.910188,0.876254,0.891156,0.861842,0.895775,0.881559,0.911743
3,0.0379,0.087985,0.918545,0.92936,0.90798,0.916091,0.905366,0.927073,0.890529,0.927017,0.856805,0.734247,0.911565,0.614679,0.864853,0.826634,0.918327
4,0.0225,0.092201,0.91298,0.926416,0.899929,0.906375,0.887805,0.925738,0.864547,0.939821,0.800436,0.888889,0.870748,0.907801,0.893198,0.883476,0.906198
5,0.0149,0.102389,0.914746,0.919794,0.909753,0.904016,0.900488,0.907571,0.87003,0.93854,0.810841,0.875817,0.911565,0.842767,0.891152,0.867733,0.917597
6,0.0092,0.10682,0.913669,0.934511,0.893737,0.916067,0.931707,0.900943,0.893035,0.919334,0.868198,0.895105,0.870748,0.920863,0.904469,0.895935,0.914075
7,0.0057,0.117013,0.914265,0.910228,0.918337,0.913519,0.896585,0.931104,0.878528,0.916773,0.843345,0.904762,0.904762,0.904762,0.902768,0.899387,0.907087
8,0.0034,0.124302,0.915847,0.924945,0.906926,0.919261,0.921951,0.916586,0.881761,0.897567,0.866502,0.880795,0.904762,0.858065,0.899416,0.88702,0.912306
9,0.0023,0.133191,0.916205,0.913171,0.919259,0.914399,0.901463,0.927711,0.881957,0.923175,0.844262,0.894915,0.897959,0.891892,0.901869,0.895781,0.908942
10,0.0014,0.13629,0.917613,0.922001,0.913265,0.916461,0.90439,0.928858,0.885749,0.923175,0.85124,0.884488,0.911565,0.858974,0.901078,0.888084,0.915283


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3133,0.095056,0.910842,0.939662,0.883737,0.88062,0.871166,0.890282,0.886416,0.932683,0.844523,0.8687,0.838668,0.900963,0.871622,0.877551,0.865772,0.88364,0.877055,0.891946
2,0.0729,0.078711,0.924431,0.927152,0.921726,0.896124,0.886503,0.905956,0.903818,0.912195,0.895594,0.881612,0.896287,0.86741,0.86645,0.904762,0.83125,0.894487,0.884387,0.90538
3,0.0439,0.092495,0.924376,0.926416,0.922344,0.9125,0.895706,0.929936,0.903382,0.912195,0.894737,0.877214,0.919334,0.838785,0.874172,0.897959,0.851613,0.898329,0.887483,0.910322
4,0.0269,0.10538,0.920088,0.923473,0.916728,0.903328,0.874233,0.934426,0.900437,0.90439,0.896518,0.872314,0.883483,0.861423,0.869281,0.904762,0.836478,0.89309,0.889115,0.898068
5,0.0173,0.11015,0.92759,0.919058,0.936282,0.922601,0.91411,0.93125,0.907308,0.902439,0.912229,0.880791,0.912932,0.850835,0.903448,0.891156,0.916084,0.908347,0.909336,0.907939
6,0.0113,0.119621,0.923077,0.931567,0.91474,0.919084,0.923313,0.914894,0.913447,0.91122,0.915686,0.890841,0.909091,0.873309,0.868687,0.877551,0.86,0.903027,0.895726,0.910548
7,0.0071,0.125569,0.922461,0.932303,0.912824,0.918239,0.895706,0.941935,0.913086,0.912195,0.913978,0.888617,0.929577,0.851114,0.884211,0.857143,0.913043,0.905323,0.906579,0.905385
8,0.0043,0.141064,0.926194,0.941869,0.911032,0.915625,0.898773,0.933121,0.902584,0.885854,0.919959,0.88318,0.924456,0.845433,0.881356,0.884354,0.878378,0.901788,0.897585,0.907061
9,0.003,0.145669,0.926829,0.922737,0.930958,0.930818,0.907975,0.954839,0.908555,0.901463,0.915758,0.887097,0.915493,0.860409,0.871287,0.897959,0.846154,0.904917,0.901624,0.909126
10,0.002,0.150306,0.92891,0.937454,0.92052,0.924528,0.90184,0.948387,0.910793,0.901463,0.920319,0.883863,0.925736,0.845614,0.86755,0.891156,0.845161,0.903129,0.896,0.91153


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3051,0.101255,0.917938,0.929412,0.906743,0.898944,0.911315,0.886905,0.892639,0.927875,0.859982,0.85063,0.90781,0.800226,0.938743,0.924765,0.95315,0.819048,0.877551,0.767857,0.886324,0.862477,0.913121
2,0.0779,0.093413,0.925899,0.927941,0.923865,0.89441,0.880734,0.908517,0.911416,0.937622,0.886636,0.883807,0.915493,0.854241,0.946792,0.948276,0.945312,0.85342,0.891156,0.81875,0.902624,0.889554,0.91687
3,0.0463,0.091373,0.919703,0.909559,0.930075,0.919003,0.902141,0.936508,0.910617,0.898635,0.922923,0.879594,0.888604,0.870765,0.948535,0.938871,0.9584,0.876254,0.891156,0.861842,0.908951,0.913419,0.904828
4,0.0285,0.101257,0.923525,0.932353,0.914863,0.917933,0.923547,0.912387,0.915108,0.929825,0.90085,0.872549,0.911652,0.836663,0.951638,0.956113,0.947205,0.891089,0.918367,0.865385,0.911974,0.896225,0.928643
5,0.018,0.115285,0.922682,0.925735,0.919649,0.917317,0.899083,0.936306,0.916988,0.925926,0.908222,0.884615,0.912932,0.858002,0.952756,0.948276,0.957278,0.869281,0.904762,0.836478,0.910607,0.902656,0.919452
6,0.0113,0.129064,0.928752,0.944118,0.913879,0.914197,0.896024,0.933121,0.910979,0.897661,0.924699,0.88318,0.924456,0.845433,0.949527,0.943574,0.955556,0.891892,0.897959,0.885906,0.913088,0.909766,0.917299
7,0.0076,0.135042,0.927133,0.930882,0.923414,0.909648,0.908257,0.911043,0.920807,0.912281,0.929494,0.882861,0.916773,0.851367,0.954186,0.946708,0.961783,0.871795,0.92517,0.824242,0.911072,0.900224,0.923345
8,0.005,0.145422,0.923741,0.944118,0.904225,0.924031,0.911315,0.937107,0.913215,0.902534,0.924152,0.880435,0.933419,0.833143,0.951334,0.949843,0.95283,0.893333,0.911565,0.875817,0.914348,0.904546,0.925466
9,0.0035,0.152543,0.926061,0.930147,0.922012,0.921175,0.911315,0.93125,0.917073,0.916179,0.917969,0.884735,0.909091,0.86165,0.954186,0.946708,0.961783,0.885993,0.92517,0.85,0.914871,0.907444,0.923102
10,0.0028,0.155535,0.927737,0.934559,0.921014,0.921175,0.911315,0.93125,0.917197,0.912281,0.922167,0.88806,0.914213,0.863362,0.952607,0.945141,0.960191,0.89701,0.918367,0.876623,0.917298,0.912435,0.922646


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1743,0.030069,0.656977,0.773973,0.570707,0.656977,0.570707,0.773973
2,0.0169,0.023276,0.79868,0.828767,0.770701,0.79868,0.770701,0.828767
3,0.012,0.019856,0.813559,0.821918,0.805369,0.813559,0.805369,0.821918
4,0.0056,0.019182,0.851064,0.821918,0.882353,0.851064,0.882353,0.821918
5,0.0041,0.020054,0.81672,0.869863,0.769697,0.81672,0.769697,0.869863
6,0.0025,0.023324,0.859016,0.89726,0.823899,0.859016,0.823899,0.89726
7,0.0015,0.023852,0.858086,0.890411,0.828025,0.858086,0.828025,0.890411
8,0.001,0.023717,0.840391,0.883562,0.801242,0.840391,0.801242,0.883562
9,0.0007,0.023598,0.83871,0.890411,0.792683,0.83871,0.792683,0.890411
10,0.0004,0.023723,0.842444,0.89726,0.793939,0.842444,0.793939,0.89726


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Org F1,Org Recall,Org Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2282,0.054995,0.845373,0.900763,0.7964,0.793548,0.842466,0.75,0.819461,0.7732,0.871615
2,0.0399,0.055738,0.828004,0.955471,0.730545,0.844156,0.890411,0.802469,0.83608,0.766507,0.922941
3,0.0228,0.052572,0.85518,0.950382,0.777315,0.898955,0.883562,0.914894,0.877068,0.846104,0.916972
4,0.0138,0.052835,0.863772,0.923664,0.811173,0.825,0.90411,0.758621,0.844386,0.784897,0.913887
5,0.0075,0.064355,0.869245,0.900763,0.839858,0.874552,0.835616,0.917293,0.871898,0.878575,0.86819
6,0.0054,0.061346,0.865847,0.940204,0.802389,0.843137,0.883562,0.80625,0.854492,0.804319,0.911883
7,0.0028,0.072585,0.872072,0.923664,0.825939,0.885906,0.90411,0.868421,0.878989,0.84718,0.913887
8,0.0021,0.072993,0.870546,0.93257,0.816258,0.898246,0.876712,0.920863,0.884396,0.868561,0.904641
9,0.0013,0.081644,0.872684,0.928753,0.822999,0.861842,0.89726,0.829114,0.867263,0.826056,0.913007
10,0.0009,0.08149,0.875604,0.922392,0.833333,0.86755,0.89726,0.839744,0.871577,0.836538,0.909826


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Org F1,Org Recall,Org Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2657,0.069665,0.868657,0.892638,0.84593,0.864417,0.928753,0.808416,0.812308,0.90411,0.73743,0.84846,0.797259,0.9085
2,0.0427,0.057769,0.894815,0.92638,0.86533,0.871576,0.910941,0.835473,0.86755,0.89726,0.839744,0.87798,0.846849,0.911527
3,0.0241,0.062933,0.910494,0.904908,0.916149,0.856977,0.937659,0.789079,0.858086,0.890411,0.828025,0.875185,0.844418,0.910993
4,0.0158,0.069332,0.903323,0.917178,0.889881,0.869159,0.946565,0.803456,0.844884,0.876712,0.815287,0.872456,0.836208,0.913485
5,0.01,0.074996,0.901716,0.886503,0.91746,0.886045,0.924936,0.850292,0.861017,0.869863,0.852349,0.882926,0.873367,0.893767
6,0.0095,0.077618,0.908537,0.91411,0.90303,0.882817,0.924936,0.844367,0.789157,0.89726,0.704301,0.86017,0.817233,0.912102
7,0.0056,0.081067,0.924499,0.920245,0.928793,0.881734,0.905852,0.858866,0.83871,0.890411,0.792683,0.881648,0.860114,0.905503
8,0.0036,0.089175,0.907692,0.904908,0.910494,0.88117,0.919847,0.845614,0.871287,0.90411,0.840764,0.886716,0.865624,0.909622
9,0.0023,0.091167,0.916667,0.911043,0.92236,0.880148,0.910941,0.851367,0.834395,0.89726,0.779762,0.87707,0.851163,0.906415
10,0.0015,0.09465,0.912442,0.911043,0.913846,0.88412,0.917303,0.853254,0.859935,0.90411,0.819876,0.885499,0.862325,0.910818


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2792,0.068446,0.885759,0.865443,0.907051,0.864374,0.847328,0.882119,0.934697,0.931034,0.938389,0.827362,0.863946,0.79375,0.878048,0.880327,0.876938
2,0.0511,0.058685,0.895706,0.892966,0.898462,0.878049,0.89313,0.863469,0.952756,0.948276,0.957278,0.883721,0.904762,0.863636,0.902558,0.895711,0.909783
3,0.0309,0.062257,0.903125,0.883792,0.923323,0.873188,0.919847,0.831034,0.932813,0.935737,0.929907,0.839117,0.904762,0.782353,0.887061,0.866654,0.911034
4,0.0192,0.062689,0.897516,0.883792,0.911672,0.861029,0.926209,0.80442,0.948859,0.945141,0.952607,0.846154,0.897959,0.8,0.888389,0.867175,0.913275
5,0.0122,0.075946,0.897397,0.896024,0.898773,0.879147,0.94402,0.822616,0.954617,0.956113,0.953125,0.882943,0.897959,0.868421,0.903526,0.885734,0.923529
6,0.0079,0.078231,0.909091,0.902141,0.916149,0.88835,0.931298,0.849188,0.950479,0.932602,0.969055,0.90785,0.904762,0.910959,0.913942,0.911338,0.917701
7,0.005,0.085545,0.884013,0.862385,0.906752,0.875153,0.909669,0.84316,0.951334,0.949843,0.95283,0.880795,0.904762,0.858065,0.897824,0.890202,0.906665
8,0.0033,0.09115,0.890555,0.908257,0.873529,0.8753,0.928753,0.827664,0.953052,0.954545,0.951562,0.867314,0.911565,0.82716,0.896555,0.869979,0.92578
9,0.0021,0.096701,0.903522,0.902141,0.904908,0.87515,0.927481,0.828409,0.956795,0.954545,0.959055,0.89726,0.891156,0.903448,0.908182,0.898955,0.918831
10,0.0015,0.098451,0.900459,0.899083,0.90184,0.879518,0.928753,0.83524,0.955083,0.949843,0.96038,0.902357,0.911565,0.893333,0.909354,0.897699,0.922311


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3163,0.099213,0.883562,0.947832,0.827453,0.887172,0.877676,0.896875,0.867168,0.881529,0.853268,0.939441,0.948276,0.930769,0.841424,0.884354,0.802469,0.883753,0.862167,0.907933
2,0.0738,0.083693,0.921283,0.928729,0.913955,0.882443,0.883792,0.881098,0.884497,0.912102,0.858513,0.944969,0.942006,0.94795,0.858934,0.931973,0.796512,0.898425,0.879605,0.91972
3,0.043,0.094596,0.914706,0.914034,0.915379,0.914463,0.899083,0.93038,0.878661,0.936306,0.827703,0.932813,0.935737,0.929907,0.89701,0.918367,0.876623,0.907531,0.895998,0.920705
4,0.0262,0.100144,0.916936,0.936811,0.897887,0.899371,0.874618,0.925566,0.883344,0.901911,0.865526,0.954014,0.959248,0.948837,0.85443,0.918367,0.798817,0.901619,0.887327,0.918191
5,0.017,0.109609,0.919927,0.92432,0.915575,0.912773,0.896024,0.930159,0.886265,0.90828,0.865291,0.945282,0.934169,0.956661,0.879195,0.891156,0.86755,0.908688,0.907047,0.91079
6,0.0105,0.11905,0.920578,0.936811,0.904897,0.911901,0.902141,0.921875,0.890019,0.89172,0.888325,0.94902,0.948276,0.949765,0.866242,0.92517,0.814371,0.907552,0.895847,0.920824
7,0.007,0.127671,0.92291,0.936811,0.909415,0.914992,0.905199,0.925,0.882033,0.928662,0.839862,0.957547,0.954545,0.960568,0.868421,0.897959,0.840764,0.909181,0.895122,0.924635
8,0.0043,0.139398,0.919751,0.922116,0.917398,0.905901,0.868502,0.946667,0.882972,0.90828,0.859036,0.953271,0.959248,0.947368,0.879195,0.891156,0.86755,0.908218,0.907604,0.90986
9,0.0027,0.147646,0.92466,0.92432,0.925,0.913313,0.902141,0.924765,0.881773,0.912102,0.853397,0.952532,0.943574,0.961661,0.882155,0.891156,0.873333,0.910887,0.907631,0.914659
10,0.0018,0.150564,0.920263,0.92432,0.916242,0.917317,0.899083,0.936306,0.885714,0.90828,0.864242,0.950198,0.942006,0.958533,0.879195,0.891156,0.86755,0.910537,0.908574,0.912969


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3038,0.102283,0.919162,0.902941,0.935976,0.895434,0.929664,0.863636,0.90149,0.91423,0.8891,0.860409,0.915493,0.811578,0.936371,0.934169,0.938583,0.81875,0.891156,0.757225,0.888603,0.866016,0.914609
2,0.0779,0.094425,0.92091,0.9375,0.904897,0.908805,0.883792,0.935275,0.899756,0.896686,0.902846,0.873494,0.928297,0.824801,0.93859,0.970219,0.908957,0.868421,0.897959,0.840764,0.901663,0.886257,0.919076
3,0.0467,0.093638,0.923248,0.915441,0.931189,0.912226,0.889908,0.935691,0.899256,0.883041,0.916077,0.864728,0.8758,0.853933,0.951713,0.95768,0.94582,0.869565,0.884354,0.855263,0.903456,0.906329,0.901037
4,0.0286,0.101186,0.920086,0.939706,0.901269,0.91047,0.917431,0.903614,0.909528,0.921053,0.898289,0.874237,0.916773,0.835473,0.943367,0.952978,0.933948,0.87013,0.911565,0.832298,0.904636,0.884149,0.926584
5,0.018,0.111516,0.922848,0.910294,0.935752,0.917574,0.902141,0.933544,0.905473,0.88694,0.924797,0.888344,0.927017,0.852768,0.948022,0.95768,0.938556,0.879195,0.891156,0.86755,0.910242,0.908828,0.912538
6,0.0116,0.131192,0.923521,0.941176,0.906516,0.925466,0.911315,0.940063,0.908552,0.895712,0.921765,0.880148,0.916773,0.846336,0.955153,0.951411,0.958926,0.89769,0.92517,0.871795,0.915088,0.907567,0.923593
7,0.0072,0.138521,0.921512,0.932353,0.91092,0.915515,0.911315,0.919753,0.907011,0.888889,0.925888,0.880342,0.923175,0.841307,0.954086,0.960815,0.94745,0.9,0.918367,0.882353,0.913078,0.904612,0.922486
8,0.0049,0.14447,0.921129,0.936029,0.906695,0.923557,0.905199,0.942675,0.917556,0.922027,0.913127,0.889027,0.918054,0.861779,0.953271,0.959248,0.947368,0.884488,0.911565,0.858974,0.914838,0.905103,0.925354
9,0.003,0.154611,0.928333,0.919118,0.937734,0.91358,0.905199,0.922118,0.913108,0.906433,0.919881,0.889306,0.910371,0.869193,0.95693,0.95768,0.956182,0.890365,0.911565,0.87013,0.91527,0.91254,0.918394
10,0.0018,0.159879,0.924487,0.927206,0.921784,0.916923,0.911315,0.922601,0.909449,0.900585,0.918489,0.884354,0.915493,0.855263,0.952306,0.954545,0.950078,0.893333,0.911565,0.875817,0.913475,0.907339,0.920118


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Loc F1,Loc Recall,Loc Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1976,0.098419,0.0,0.0,1.0,0.0,1.0,0.0
2,0.0988,0.098671,0.0,0.0,1.0,0.0,1.0,0.0
3,0.0981,0.098828,0.0,0.0,1.0,0.0,1.0,0.0
4,0.0983,0.099391,0.0,0.0,1.0,0.0,1.0,0.0
5,0.0983,0.098106,0.0,0.0,1.0,0.0,1.0,0.0
6,0.0997,0.098633,0.0,0.0,1.0,0.0,1.0,0.0
7,0.0987,0.09809,0.0,0.0,1.0,0.0,1.0,0.0
8,0.0982,0.098816,0.0,0.0,1.0,0.0,1.0,0.0
9,0.0988,0.09815,0.0,0.0,1.0,0.0,1.0,0.0
10,0.0981,0.098347,0.0,0.0,1.0,0.0,1.0,0.0


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2243,0.058098,0.887606,0.848418,0.930589,0.897411,0.911392,0.883853,0.892509,0.907221,0.879905
2,0.0408,0.049856,0.908029,0.915379,0.900797,0.903103,0.92113,0.885768,0.905566,0.893282,0.918254
3,0.0213,0.051958,0.911947,0.918322,0.90566,0.888989,0.962999,0.825543,0.900468,0.865601,0.940661
4,0.0119,0.063355,0.905136,0.933775,0.878201,0.89726,0.892892,0.901672,0.901198,0.889936,0.913333
5,0.0072,0.072319,0.904228,0.92053,0.888494,0.89068,0.860759,0.922756,0.897454,0.905625,0.890645
6,0.004,0.080383,0.910682,0.919058,0.902457,0.891423,0.875365,0.908081,0.901052,0.905269,0.897212
7,0.0024,0.073827,0.907076,0.933775,0.881862,0.893638,0.895813,0.891473,0.900357,0.886668,0.914794
8,0.0016,0.07908,0.909613,0.933039,0.887334,0.897398,0.889971,0.90495,0.903505,0.896142,0.911505
9,0.001,0.081794,0.911466,0.924209,0.899069,0.896552,0.898734,0.89438,0.904009,0.896725,0.911472
10,0.0007,0.083709,0.915881,0.92936,0.902788,0.898778,0.894839,0.90275,0.907329,0.902769,0.9121


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2747,0.074372,0.896023,0.903606,0.888567,0.873587,0.826848,0.925926,0.795181,0.897959,0.713514,0.85493,0.842669,0.876138
2,0.0526,0.061603,0.907654,0.92936,0.886938,0.907958,0.921206,0.895085,0.889632,0.904762,0.875,0.901748,0.885674,0.918443
3,0.0304,0.060051,0.916332,0.922737,0.910015,0.906146,0.925097,0.887955,0.855263,0.884354,0.828025,0.89258,0.875332,0.910729
4,0.0181,0.066167,0.914495,0.916851,0.912152,0.902724,0.902724,0.902724,0.82866,0.904762,0.764368,0.88196,0.859748,0.908112
5,0.0111,0.073134,0.915254,0.89404,0.9375,0.906375,0.885214,0.928571,0.850649,0.891156,0.813665,0.890759,0.893245,0.890137
6,0.0071,0.079489,0.906506,0.93819,0.876891,0.911057,0.901751,0.920556,0.85342,0.891156,0.81875,0.890327,0.872066,0.910366
7,0.0043,0.081205,0.915716,0.915379,0.916053,0.906312,0.893969,0.919,0.845161,0.891156,0.803681,0.889063,0.879578,0.900168
8,0.0026,0.085138,0.919177,0.92053,0.917828,0.904645,0.899805,0.909538,0.85342,0.891156,0.81875,0.892414,0.882039,0.903831
9,0.0016,0.091769,0.912869,0.921266,0.904624,0.90927,0.896887,0.922,0.854369,0.897959,0.814815,0.892169,0.88048,0.905371
10,0.001,0.094267,0.915081,0.919794,0.910415,0.909451,0.893969,0.925478,0.85342,0.891156,0.81875,0.89265,0.884881,0.90164


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2979,0.090636,0.896109,0.923473,0.870319,0.881053,0.914146,0.850272,0.862155,0.880922,0.844172,0.822785,0.884354,0.769231,0.865525,0.833498,0.900724
2,0.0643,0.079631,0.904984,0.928624,0.882517,0.908831,0.92878,0.88972,0.881818,0.869398,0.894598,0.858086,0.884354,0.833333,0.88843,0.875042,0.902789
3,0.0385,0.080063,0.915291,0.93819,0.893483,0.899074,0.899512,0.898635,0.876351,0.934699,0.824859,0.867314,0.911565,0.82716,0.889507,0.861034,0.920991
4,0.0231,0.09106,0.914683,0.919058,0.91035,0.909538,0.902439,0.916749,0.886169,0.927017,0.848769,0.888158,0.918367,0.859873,0.899637,0.883935,0.91672
5,0.0147,0.102582,0.910475,0.924209,0.897143,0.902716,0.891707,0.914,0.865955,0.934699,0.80663,0.839506,0.92517,0.768362,0.879663,0.846534,0.918946
6,0.0093,0.111031,0.917002,0.922737,0.911337,0.91138,0.918049,0.904808,0.893805,0.90525,0.882647,0.85623,0.911565,0.807229,0.894604,0.876505,0.9144
7,0.0057,0.119112,0.918188,0.924945,0.91153,0.904573,0.887805,0.921986,0.890693,0.912932,0.869512,0.888889,0.897959,0.88,0.900586,0.895757,0.90591
8,0.0037,0.125098,0.918583,0.925681,0.911594,0.910979,0.898537,0.923771,0.889299,0.925736,0.855621,0.881579,0.911565,0.853503,0.90011,0.886123,0.91538
9,0.0022,0.133809,0.919708,0.927152,0.912382,0.913519,0.896585,0.931104,0.890386,0.930858,0.853286,0.89701,0.918367,0.876623,0.905156,0.893349,0.918241
10,0.0016,0.136596,0.919414,0.923473,0.91539,0.912593,0.901463,0.924,0.893432,0.923175,0.865546,0.902357,0.911565,0.893333,0.906949,0.899567,0.914919


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3083,0.096103,0.905634,0.945588,0.868919,0.895169,0.957115,0.840753,0.873737,0.886044,0.861768,0.918462,0.935737,0.901813,0.852459,0.884354,0.822785,0.889092,0.859208,0.921767
2,0.0716,0.083935,0.922173,0.923529,0.920821,0.904218,0.887914,0.921132,0.884663,0.923175,0.849234,0.951258,0.948276,0.954259,0.883721,0.904762,0.863636,0.909207,0.901817,0.917531
3,0.0429,0.088934,0.921101,0.922794,0.919414,0.907345,0.921053,0.89404,0.891925,0.919334,0.866104,0.955626,0.945141,0.966346,0.888136,0.891156,0.885135,0.912827,0.906208,0.919896
4,0.0264,0.101716,0.919431,0.927206,0.911786,0.893471,0.88694,0.900099,0.872079,0.90781,0.839053,0.955153,0.951411,0.958926,0.867314,0.911565,0.82716,0.90149,0.887405,0.916986
5,0.0166,0.113092,0.92233,0.908088,0.937026,0.908006,0.889864,0.926904,0.879121,0.921895,0.84014,0.944969,0.942006,0.94795,0.897959,0.897959,0.897959,0.910477,0.909996,0.911962
6,0.0109,0.116881,0.919735,0.918382,0.921091,0.8999,0.876218,0.924897,0.883397,0.892446,0.874529,0.951931,0.946708,0.957211,0.902098,0.877551,0.928058,0.911412,0.921157,0.902261
7,0.0066,0.127028,0.919017,0.934559,0.903983,0.913869,0.915205,0.912536,0.884567,0.902689,0.867159,0.951779,0.943574,0.960128,0.872852,0.863946,0.881944,0.908417,0.90515,0.911994
8,0.0042,0.137693,0.922569,0.924265,0.920879,0.909182,0.887914,0.931493,0.880353,0.895006,0.866171,0.954403,0.951411,0.957413,0.889632,0.904762,0.875,0.911228,0.910191,0.912672
9,0.0028,0.141464,0.924265,0.924265,0.924265,0.91264,0.911306,0.913978,0.891672,0.911652,0.872549,0.948859,0.945141,0.952607,0.883721,0.904762,0.863636,0.912231,0.905407,0.919425
10,0.0019,0.144809,0.922797,0.931618,0.914141,0.915154,0.909357,0.921027,0.887508,0.914213,0.862319,0.949922,0.951411,0.948438,0.882155,0.891156,0.873333,0.911507,0.903852,0.919551


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3034,0.106041,0.912757,0.915441,0.910088,0.894118,0.929664,0.86119,0.89697,0.937622,0.859696,0.855569,0.895006,0.819461,0.939227,0.932602,0.945946,0.831746,0.891156,0.779762,0.888398,0.86269,0.916915
2,0.0778,0.096889,0.925362,0.916176,0.934734,0.907956,0.889908,0.926752,0.904624,0.915205,0.894286,0.881653,0.901408,0.862745,0.947123,0.954545,0.939815,0.882155,0.891156,0.873333,0.908146,0.905277,0.9114
3,0.0472,0.091513,0.915344,0.890441,0.94168,0.904239,0.880734,0.929032,0.904947,0.909357,0.900579,0.871158,0.852753,0.890374,0.949099,0.949843,0.948357,0.891156,0.891156,0.891156,0.90599,0.916863,0.895714
4,0.029,0.102866,0.919927,0.925,0.914909,0.90303,0.911315,0.894895,0.905624,0.925926,0.886194,0.871106,0.912932,0.832944,0.950743,0.952978,0.948518,0.88,0.897959,0.862745,0.905072,0.890034,0.921018
5,0.0187,0.109492,0.919714,0.897059,0.943542,0.914557,0.883792,0.947541,0.913211,0.923002,0.903626,0.885185,0.918054,0.854589,0.952157,0.951411,0.952904,0.88,0.897959,0.862745,0.910804,0.910825,0.911879
6,0.0118,0.128255,0.925559,0.927941,0.923189,0.911353,0.896024,0.927215,0.905679,0.893762,0.917918,0.875384,0.912932,0.840802,0.952456,0.942006,0.963141,0.912162,0.918367,0.90604,0.913766,0.913051,0.915172
7,0.0076,0.1366,0.926254,0.923529,0.928994,0.905426,0.892966,0.918239,0.913086,0.911306,0.914873,0.885,0.90653,0.864469,0.949179,0.951411,0.946958,0.888889,0.92517,0.855346,0.911306,0.904813,0.918485
8,0.0046,0.148093,0.923021,0.925735,0.920322,0.919505,0.908257,0.931034,0.907425,0.917154,0.897901,0.887508,0.914213,0.862319,0.953052,0.954545,0.951562,0.895623,0.904762,0.886667,0.914355,0.908301,0.920778
9,0.0032,0.151263,0.922173,0.923529,0.920821,0.926677,0.908257,0.94586,0.915122,0.91423,0.916016,0.89351,0.90781,0.879653,0.952157,0.951411,0.952904,0.890365,0.911565,0.87013,0.916667,0.914231,0.919467
10,0.0019,0.155763,0.925516,0.922794,0.928254,0.911076,0.892966,0.929936,0.91744,0.915205,0.919687,0.893058,0.914213,0.872861,0.951563,0.954545,0.948598,0.885906,0.897959,0.874172,0.914093,0.912251,0.91628


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1612,0.01779,0.93397,0.922956,0.94525,0.93397,0.94525,0.922956
2,0.0162,0.013792,0.918336,0.937107,0.900302,0.918336,0.900302,0.937107
3,0.0081,0.015436,0.937008,0.935535,0.938486,0.937008,0.938486,0.935535
4,0.0049,0.015804,0.931617,0.910377,0.953871,0.931617,0.953871,0.910377
5,0.0027,0.019383,0.932379,0.921384,0.943639,0.932379,0.943639,0.921384
6,0.0022,0.018381,0.931836,0.913522,0.9509,0.931836,0.9509,0.913522
7,0.0012,0.018718,0.933018,0.930818,0.935229,0.933018,0.935229,0.930818
8,0.0009,0.018624,0.932283,0.930818,0.933754,0.932283,0.933754,0.930818
9,0.0008,0.019368,0.929755,0.926101,0.933439,0.929755,0.933439,0.926101
10,0.0006,0.01942,0.929644,0.924528,0.934817,0.929644,0.934817,0.924528


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.1986,0.045341,0.830534,0.831804,0.829268,0.933852,0.943396,0.924499,0.882193,0.876884,0.8876
2,0.0249,0.026628,0.885145,0.883792,0.886503,0.927851,0.940252,0.915773,0.906498,0.901138,0.912022
3,0.0131,0.027649,0.876106,0.908257,0.846154,0.924012,0.955975,0.894118,0.900059,0.870136,0.932116
4,0.0086,0.025741,0.881098,0.883792,0.878419,0.914153,0.929245,0.899543,0.897625,0.888981,0.906519
5,0.0056,0.025861,0.88958,0.874618,0.905063,0.933121,0.921384,0.945161,0.911351,0.925112,0.898001
6,0.0033,0.025789,0.890282,0.868502,0.913183,0.938449,0.922956,0.954472,0.914366,0.933827,0.895729
7,0.0022,0.027929,0.885802,0.877676,0.894081,0.93617,0.933962,0.938389,0.910986,0.916235,0.905819
8,0.0016,0.030895,0.886536,0.896024,0.877246,0.9377,0.922956,0.952922,0.912118,0.915084,0.90949
9,0.001,0.030846,0.892587,0.902141,0.883234,0.935535,0.935535,0.935535,0.914061,0.909384,0.918838
10,0.0008,0.030645,0.896024,0.896024,0.896024,0.940239,0.927673,0.95315,0.918132,0.924587,0.911849


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2442,0.047445,0.88,0.874618,0.885449,0.899951,0.896887,0.903036,0.937844,0.937107,0.938583,0.905932,0.909023,0.902871
2,0.036,0.040014,0.899536,0.889908,0.909375,0.895945,0.892023,0.899902,0.944444,0.935535,0.953526,0.913309,0.920934,0.905822
3,0.02,0.038843,0.877743,0.856269,0.900322,0.898678,0.892996,0.904433,0.94127,0.93239,0.950321,0.905897,0.918359,0.893885
4,0.0125,0.04143,0.891207,0.914373,0.869186,0.898804,0.950389,0.852531,0.943785,0.937107,0.950558,0.911265,0.890758,0.933956
5,0.0069,0.04203,0.898331,0.905199,0.891566,0.899065,0.888132,0.910269,0.943426,0.930818,0.956381,0.913607,0.919406,0.90805
6,0.0045,0.042941,0.916031,0.917431,0.914634,0.898876,0.894942,0.902846,0.948125,0.933962,0.962723,0.92101,0.926734,0.915445
7,0.0029,0.046337,0.907436,0.914373,0.900602,0.904785,0.910506,0.899135,0.950872,0.943396,0.958466,0.921031,0.919401,0.922758
8,0.0019,0.052171,0.903522,0.902141,0.904908,0.900733,0.895914,0.905605,0.949881,0.938679,0.961353,0.918045,0.923955,0.912245
9,0.0011,0.053225,0.90303,0.911315,0.894895,0.904785,0.910506,0.899135,0.94586,0.933962,0.958065,0.917892,0.917365,0.918594
10,0.0008,0.053674,0.900602,0.914373,0.88724,0.903069,0.901751,0.90439,0.946783,0.937107,0.956661,0.916818,0.916097,0.917744


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Per F1,Per Recall,Per Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2778,0.073899,0.899037,0.92579,0.873786,0.881141,0.850153,0.914474,0.888023,0.88716,0.888889,0.932912,0.929245,0.936609,0.900278,0.903439,0.898087
2,0.0547,0.06558,0.908758,0.911095,0.906433,0.896764,0.889908,0.903727,0.899773,0.964981,0.842821,0.938291,0.93239,0.944268,0.910897,0.899312,0.924593
3,0.0301,0.065795,0.917544,0.927994,0.907328,0.901899,0.87156,0.934426,0.906718,0.912451,0.901057,0.942745,0.944969,0.940532,0.917227,0.920836,0.914243
4,0.018,0.068306,0.911063,0.92579,0.896797,0.882995,0.865443,0.901274,0.90483,0.920233,0.889934,0.943574,0.946541,0.940625,0.910616,0.907158,0.914502
5,0.0109,0.077156,0.917249,0.916238,0.918262,0.894656,0.896024,0.893293,0.915534,0.917315,0.91376,0.942292,0.937107,0.947536,0.917433,0.918213,0.916671
6,0.0068,0.0863,0.913455,0.922851,0.904248,0.903427,0.88685,0.920635,0.912023,0.907588,0.916503,0.945055,0.946541,0.943574,0.91849,0.92124,0.915957
7,0.0042,0.090929,0.917853,0.923586,0.912192,0.898148,0.889908,0.906542,0.913532,0.909533,0.917566,0.943785,0.937107,0.950558,0.91833,0.921715,0.915033
8,0.0032,0.098382,0.918092,0.926525,0.909812,0.893939,0.902141,0.885886,0.914592,0.911479,0.917728,0.940898,0.938679,0.943128,0.916881,0.914138,0.919706
9,0.0021,0.100711,0.913479,0.903747,0.923423,0.901366,0.908257,0.894578,0.915486,0.911479,0.919529,0.942948,0.935535,0.950479,0.91832,0.922002,0.914754
10,0.0013,0.103755,0.917155,0.919177,0.915143,0.904615,0.899083,0.910217,0.915897,0.916342,0.915452,0.942384,0.938679,0.946117,0.920013,0.921732,0.91832


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.2993,0.082368,0.913202,0.919912,0.906589,0.9,0.880734,0.920128,0.891945,0.88241,0.901688,0.928515,0.929245,0.927786,0.867797,0.870748,0.864865,0.900292,0.904211,0.89661
2,0.0634,0.072301,0.918094,0.905952,0.930566,0.887172,0.877676,0.896875,0.904135,0.934888,0.875341,0.945227,0.949686,0.94081,0.844444,0.904762,0.791667,0.899814,0.887052,0.914593
3,0.0357,0.075065,0.919927,0.92432,0.915575,0.91875,0.899083,0.939297,0.908035,0.911565,0.904532,0.944268,0.93239,0.956452,0.910345,0.897959,0.923077,0.920265,0.927787,0.913063
4,0.0214,0.080583,0.919574,0.919912,0.919236,0.903226,0.856269,0.955631,0.907115,0.892128,0.922613,0.954829,0.963836,0.945988,0.855305,0.904762,0.810976,0.90801,0.910889,0.907382
5,0.0131,0.087086,0.92523,0.922851,0.927622,0.917178,0.914373,0.92,0.909804,0.901846,0.917903,0.94462,0.938679,0.950637,0.89726,0.891156,0.903448,0.918819,0.923922,0.913781
6,0.0082,0.091598,0.923869,0.922851,0.92489,0.926448,0.905199,0.948718,0.912023,0.906706,0.917404,0.944795,0.941824,0.947785,0.909091,0.884354,0.935252,0.923245,0.93481,0.912187
7,0.0054,0.102589,0.921512,0.931668,0.911574,0.919084,0.920489,0.917683,0.911111,0.916424,0.90586,0.951638,0.959119,0.944272,0.890411,0.884354,0.896552,0.918751,0.915188,0.922411
8,0.0037,0.113564,0.921389,0.92579,0.917031,0.909091,0.902141,0.916149,0.908006,0.887269,0.929735,0.948276,0.951258,0.945312,0.864516,0.911565,0.822086,0.910256,0.906063,0.915604
9,0.0024,0.113978,0.924715,0.925055,0.924376,0.916031,0.917431,0.914634,0.90579,0.896987,0.914767,0.945712,0.944969,0.946457,0.867314,0.911565,0.82716,0.911912,0.905479,0.919201
10,0.0016,0.11781,0.92522,0.927259,0.923189,0.917829,0.905199,0.930818,0.90651,0.899903,0.913215,0.948859,0.948113,0.949606,0.860841,0.904762,0.820988,0.911852,0.907563,0.917047


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Some weights of the model checkpoint at monologg/koelectra-base-v3-discriminator were not used when initializing ElectraForTokenClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense.weight']
- This IS expected if you are initializing ElectraForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForTokenClassification were not initialized from the model checkpoint at monologg/koelectra-base-v3-discriminator and are newly initialized: ['classifier

Epoch,Training Loss,Validation Loss,Cvl F1,Cvl Recall,Cvl Precision,Dat F1,Dat Recall,Dat Precision,Loc F1,Loc Recall,Loc Precision,Org F1,Org Recall,Org Precision,Per F1,Per Recall,Per Precision,Qnt F1,Qnt Recall,Qnt Precision,Entity Macro F1,Entity Macro Precision,Entity Macro Recall
1,0.3029,0.104975,0.914798,0.9,0.930091,0.855932,0.926606,0.795276,0.894889,0.904483,0.885496,0.853397,0.916773,0.798216,0.94127,0.929467,0.953376,0.859935,0.897959,0.825,0.886704,0.864576,0.912548
2,0.0791,0.091114,0.924487,0.927206,0.921784,0.903633,0.874618,0.934641,0.898898,0.91423,0.884072,0.869779,0.90653,0.835891,0.942457,0.949843,0.935185,0.870432,0.891156,0.850649,0.901614,0.893704,0.910597
3,0.0466,0.092517,0.916353,0.894118,0.939722,0.910518,0.88685,0.935484,0.90329,0.883041,0.92449,0.877081,0.877081,0.877081,0.946952,0.937304,0.9568,0.895833,0.877551,0.914894,0.908338,0.924745,0.892657
4,0.028,0.102278,0.927042,0.938971,0.915412,0.918587,0.914373,0.92284,0.910244,0.909357,0.911133,0.887805,0.932138,0.847497,0.954829,0.960815,0.948916,0.891089,0.918367,0.865385,0.914933,0.901864,0.929004
5,0.0175,0.112625,0.926991,0.924265,0.929734,0.90881,0.899083,0.91875,0.911851,0.907407,0.916339,0.890819,0.919334,0.864019,0.95283,0.949843,0.955836,0.891892,0.897959,0.885906,0.913866,0.911764,0.916315
6,0.011,0.130843,0.924303,0.938235,0.910778,0.918495,0.896024,0.942122,0.912765,0.902534,0.92323,0.88228,0.911652,0.854742,0.951563,0.954545,0.948598,0.920415,0.904762,0.93662,0.918303,0.919348,0.917959
7,0.0072,0.135859,0.923639,0.929412,0.917938,0.917574,0.902141,0.933544,0.915423,0.896686,0.934959,0.886406,0.914213,0.860241,0.951334,0.949843,0.95283,0.9,0.918367,0.882353,0.915729,0.913644,0.918444
8,0.0045,0.143461,0.92491,0.941912,0.908511,0.92,0.914373,0.925697,0.917315,0.919103,0.915534,0.887227,0.911652,0.864078,0.94647,0.956113,0.93702,0.9,0.918367,0.882353,0.915987,0.905532,0.92692
9,0.0027,0.154322,0.928833,0.930882,0.926794,0.92093,0.908257,0.933962,0.91482,0.905458,0.924378,0.887626,0.900128,0.875467,0.952157,0.951411,0.952904,0.888889,0.897959,0.88,0.915543,0.915584,0.915683
10,0.0018,0.160084,0.927737,0.934559,0.921014,0.92093,0.908257,0.933962,0.917035,0.910331,0.923838,0.891807,0.912932,0.871638,0.952232,0.952978,0.951487,0.902357,0.911565,0.893333,0.918683,0.915879,0.92177


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).
