<a href="https://colab.research.google.com/github/ekaterinatao/NER_biomed_domain/blob/main/active_learning/%D0%92%D0%9A%D0%A0_nerel_bio_RuBioBERT_active_learning_v5_random_seeds.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Обучение с разными сидами для расчета доверительных интервалов
# Инструменты
Предобработанный датасет [NEREL-BIO](https://huggingface.co/datasets/ekaterinatao/nerel_bio_ner_unnested)  

Исходная модель [RuBioBERT](https://huggingface.co/alexyalunin/RuBioBERT)

### Установка зависимостей

In [None]:
!pip install datasets accelerate evaluate wandb seqeval -q

[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m510.5/510.5 kB[0m [31m3.4 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m297.4/297.4 kB[0m [31m21.9 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m84.1/84.1 kB[0m [31m9.6 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m2.2/2.2 MB[0m [31m22.4 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m43.6/43.6 kB[0m [31m4.2 MB/s[0m eta [36m0:00:00[0m
[?25h  Preparing metadata (setup.py) ... [?25l[?25hdone
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m116.3/116.3 kB[0m [31m5.8 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m194.1/194.1 kB[0m [31m2.0 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m134.8/134.8 kB[0m [31m7.6 M

In [None]:
import json
import os
import random
import warnings
from dataclasses import dataclass

import numpy as np
import pandas as pd
import torch
from torch.nn.functional import softmax
import datasets
from datasets import Dataset, DatasetDict, concatenate_datasets
from transformers import (AutoTokenizer,
                          DataCollatorForTokenClassification,
                          AutoModelForTokenClassification,
                          TrainingArguments, Trainer)
import evaluate
warnings.filterwarnings("ignore")

In [None]:
@dataclass
class TrainingConfig:
    """Hyper-parameters and resource names shared by every cell of the notebook.

    Each attribute carries a type annotation so that ``@dataclass`` registers it
    as a real field: values can be overridden per instance, e.g.
    ``TrainingConfig(n_epochs=3)``, and show up in ``repr``. Without annotations
    the decorator generates an ``__init__`` that accepts no arguments.
    """

    # Dataset name passed to `datasets.load_dataset`
    dataset: str = 'ekaterinatao/nerel_bio_ner_unnested'
    # Checkpoint used for both the tokenizer and the token-classification model
    checkpoint: str = 'alexyalunin/RuBioBERT'
    # Used as `output_dir` of `TrainingArguments`
    hf_repo_id: str = "ekaterinatao/nerel-bio-RuBioBERT-al"
    # `num_labels` of the classification head
    n_labels: int = 45
    n_epochs: int = 10
    train_batch_size: int = 4
    eval_batch_size: int = 4
    # Evaluated once, when the class is defined
    device: str = "cuda" if torch.cuda.is_available() else "cpu"
    l_rate: float = 5e-05
    w_decay: float = 0.1
    # Passed to `TrainingArguments` as `warmup_ratio`
    warm_up: float = 0.1
    # Prefix of the run name; the seed is appended to it
    run_name: str = "RuBioBERT_AL_v5_3"

config = TrainingConfig()

In [None]:
def fix_seed(seed):
    """Seed the Python, NumPy and PyTorch random generators and pin cuDNN settings.

    Args:
        seed: integer seed; NumPy integer scalars are accepted as well.

    Side effects:
        Sets ``torch.backends.cudnn.deterministic = True`` and
        ``torch.backends.cudnn.benchmark = False``, and prints the seed in use.
    """
    # Seeds taken from a NumPy array are np.int64 values, which `random.seed`
    # rejects with TypeError on Python >= 3.11; a built-in int works everywhere.
    seed = int(seed)

    random.seed(seed)
    np.random.seed(seed)

    torch.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)

    torch.backends.cudnn.deterministic = True
    torch.backends.cudnn.benchmark = False
    print("Current seed: ", seed)

In [None]:
# Generate a fixed list of seeds so that the experiments are reproducible.
np.random.seed(64)
# `.tolist()` converts the NumPy scalars to built-in ints, so the seeds can be
# handed to `random.seed`, `TrainingArguments` and JSON without type issues.
seed_lst = np.random.randint(65, 2024, size=4).tolist()

### Скачивание датасета

In [None]:
# Load the dataset named in the config; the bare expression below displays its splits.
dataset = datasets.load_dataset(config.dataset)
dataset

Downloading readme:   0%|          | 0.00/1.56k [00:00<?, ?B/s]

Downloading data:   0%|          | 0.00/603k [00:00<?, ?B/s]

Downloading data:   0%|          | 0.00/76.2k [00:00<?, ?B/s]

Downloading data:   0%|          | 0.00/70.8k [00:00<?, ?B/s]

Generating train split:   0%|          | 0/612 [00:00<?, ? examples/s]

Generating valid split:   0%|          | 0/77 [00:00<?, ? examples/s]

Generating test split:   0%|          | 0/77 [00:00<?, ? examples/s]

DatasetDict({
    train: Dataset({
        features: ['id', 'words', 'ner_tags'],
        num_rows: 612
    })
    valid: Dataset({
        features: ['id', 'words', 'ner_tags'],
        num_rows: 77
    })
    test: Dataset({
        features: ['id', 'words', 'ner_tags'],
        num_rows: 77
    })
})

In [None]:
# Label vocabulary: tags are read from a single-column file and a tag's
# position in the list is used as its integer id.
url = 'https://raw.githubusercontent.com/ekaterinatao/NER_biomed_domain/main/labels.txt'
tags = pd.read_csv(url, names=['tag'])['tag'].tolist()
tag_to_id = {name: idx for idx, name in enumerate(tags)}
id_to_tag = dict(enumerate(tags))

___
### Токенизация

In [None]:
# Tokenizer that belongs to the checkpoint the model is later initialised from.
tokenizer = AutoTokenizer.from_pretrained(config.checkpoint)

tokenizer_config.json:   0%|          | 0.00/413 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/1.78M [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/2.75M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]

In [None]:
def tokenize_and_align_labels(examples):
    """Tokenize pre-split words and project word-level tags onto the sub-tokens.

    Args:
        examples: batch with a "words" column (one list of words per example)
            and a "ner_tags" column (one tag per word).

    Returns:
        The tokenizer output extended with a "labels" entry. For every example,
        the first sub-token of each word carries that word's tag; special tokens
        and the remaining sub-tokens of a word are labelled -100.
    """
    encoded = tokenizer(
        examples["words"],
        truncation=True,
        max_length=512,
        is_split_into_words=True,
    )

    aligned = []
    for row, word_tags in enumerate(examples["ner_tags"]):
        row_labels = []
        last_word = None
        # word_ids() maps each token to the index of its source word (None for special tokens)
        for word in encoded.word_ids(batch_index=row):
            starts_new_word = word is not None and word != last_word
            row_labels.append(word_tags[word] if starts_new_word else -100)
            last_word = word
        aligned.append(row_labels)

    encoded["labels"] = aligned
    return encoded

In [None]:
# Tokenize and align labels for every split, in batches; the bare expression displays the result.
tokenized_dataset = dataset.map(
    tokenize_and_align_labels, batched=True
)
tokenized_dataset

Map:   0%|          | 0/612 [00:00<?, ? examples/s]

Map:   0%|          | 0/77 [00:00<?, ? examples/s]

Map:   0%|          | 0/77 [00:00<?, ? examples/s]

DatasetDict({
    train: Dataset({
        features: ['id', 'words', 'ner_tags', 'input_ids', 'token_type_ids', 'attention_mask', 'labels'],
        num_rows: 612
    })
    valid: Dataset({
        features: ['id', 'words', 'ner_tags', 'input_ids', 'token_type_ids', 'attention_mask', 'labels'],
        num_rows: 77
    })
    test: Dataset({
        features: ['id', 'words', 'ner_tags', 'input_ids', 'token_type_ids', 'attention_mask', 'labels'],
        num_rows: 77
    })
})

# Обучение модели

In [None]:
# Metric object used by compute_metrics below.
seqeval = evaluate.load("seqeval")

def compute_metrics(p):
    """Compute overall seqeval precision, recall, F1 and accuracy.

    Args:
        p: pair ``(predictions, labels)``; the predicted class is taken as the
            argmax over axis 2 of ``predictions``.

    Returns:
        Dict with the keys "precision", "recall", "f1" and "accuracy".
    """
    scores, gold = p
    predicted_ids = np.argmax(scores, axis=2)

    true_predictions = []
    true_labels = []
    for predicted_row, gold_row in zip(predicted_ids, gold):
        kept_predictions = []
        kept_labels = []
        for predicted_id, gold_id in zip(predicted_row, gold_row):
            # Positions labelled -100 are excluded from both sequences
            if gold_id == -100:
                continue
            kept_predictions.append(tags[predicted_id])
            kept_labels.append(tags[gold_id])
        true_predictions.append(kept_predictions)
        true_labels.append(kept_labels)

    results = seqeval.compute(predictions=true_predictions, references=true_labels)
    summary = {
        "precision": results["overall_precision"],
        "recall": results["overall_recall"],
        "f1": results["overall_f1"],
        "accuracy": results["overall_accuracy"],
    }
    return summary

Downloading builder script:   0%|          | 0.00/6.34k [00:00<?, ?B/s]

In [None]:
def choose_samples_random(test_predictions, n_tokens: int) -> list:
    """Randomly pick which pool examples to label next.

    Args:
        test_predictions: array whose first dimension is the number of
            candidate examples; only ``shape[0]`` is used.
        n_tokens: how many distinct indices to draw.

    Returns:
        A list of ``n_tokens`` distinct indices in ``range(shape[0])``, drawn
        with the global ``random`` module.

    Raises:
        ValueError: if ``n_tokens`` exceeds the number of candidates.
    """

    return random.sample(range(test_predictions.shape[0]), n_tokens)

In [None]:
# Collator handed to the Trainer to assemble token-classification batches.
data_collator = DataCollatorForTokenClassification(tokenizer=tokenizer)

In [None]:
# Show which device the config resolved to ("cuda" or "cpu").
print(f'device is {config.device}')

device is cuda


In [None]:
# Interactive Hugging Face Hub login; the training arguments below set push_to_hub=True.
from huggingface_hub import notebook_login
notebook_login()

VBox(children=(HTML(value='<center> <img\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.sv…

In [None]:
# Interactive Weights & Biases login; training metrics are reported to wandb.
import wandb
wandb.login()

<IPython.core.display.Javascript object>

[34m[1mwandb[0m: Logging into wandb.ai. (Learn how to deploy a W&B server locally: https://wandb.me/wandb-server)
[34m[1mwandb[0m: You can find your API key in your browser here: https://wandb.ai/authorize
wandb: Paste an API key from your profile and hit enter, or press ctrl+c to quit:

 ··········


[34m[1mwandb[0m: Appending key for api.wandb.ai to your netrc file: /root/.netrc


True

In [None]:
def train_and_predict(
    al_train_dataset, eval_dataset, al_test_dataset, test_dataset,
    model, tokenizer, data_collator, compute_metrics, SEED
):
    """Train the model, then collect metrics and predictions.

    Args:
        al_train_dataset: examples used for training.
        eval_dataset: examples evaluated after every epoch and once more after training.
        al_test_dataset: pool of examples to predict on; skipped when it has no rows.
        test_dataset: held-out examples, predicted with the "test" metric prefix.
        model, tokenizer, data_collator, compute_metrics: forwarded to ``Trainer``.
        SEED: used as ``seed`` and ``data_seed`` and appended to the run name.

    Returns:
        ``(metrics, probas, trainer)``: ``metrics`` merges the train loss with the
        evaluation, "pred" and "test" metrics; ``probas`` is the ``predictions``
        attribute of ``trainer.predict`` on ``al_test_dataset`` (no softmax is
        applied in this function), or ``None`` when that dataset is empty.
    """
    run_label = config.run_name + f'{SEED}'
    trainer = Trainer(
        model=model,
        args=TrainingArguments(
            output_dir=config.hf_repo_id,
            num_train_epochs=config.n_epochs,
            learning_rate=config.l_rate,
            weight_decay=config.w_decay,
            warmup_ratio=config.warm_up,
            per_device_train_batch_size=config.train_batch_size,
            per_device_eval_batch_size=config.eval_batch_size,
            group_by_length=True,
            optim="adamw_torch",
            lr_scheduler_type="cosine",
            evaluation_strategy="epoch",
            seed=SEED,
            data_seed=SEED,
            push_to_hub=True,
            save_strategy="no",
            report_to="wandb",
            logging_steps=16,
            run_name=run_label,
        ),
        train_dataset=al_train_dataset,
        eval_dataset=eval_dataset,
        tokenizer=tokenizer,
        data_collator=data_collator,
        compute_metrics=compute_metrics,
    )

    train_output = trainer.train()
    metrics = {'train_loss': train_output.metrics['train_loss']}
    metrics.update(trainer.evaluate(eval_dataset))

    # Predictions on the pool are only produced while the pool is non-empty
    probas = None
    if al_test_dataset.num_rows > 0:
        pool_output = trainer.predict(al_test_dataset, metric_key_prefix="pred")
        probas = pool_output.predictions
        metrics.update(pool_output.metrics)

    held_out_output = trainer.predict(test_dataset, metric_key_prefix="test")
    metrics.update(held_out_output.metrics)

    return metrics, probas, trainer

In [None]:
def run_active_learning(
    dataset, al_iters, init_train_size, choose_tokens,
    tokenizer, data_collator, compute_metrics, SEED
):
    """Run the active-learning loop with random sample selection.

    A random fraction of ``dataset['train']`` forms the initial training set and
    the rest becomes the pool. Each iteration trains a fresh model from
    ``config.checkpoint``, records its metrics and moves ``choose_tokens``
    randomly chosen pool examples into the training set.

    Args:
        dataset: mapping with 'train', 'valid' and 'test' splits; rows of the
            'train' split must have an 'id' column (assumed hashable and unique).
        al_iters: number of active-learning iterations.
        init_train_size: fraction of the 'train' split used initially.
        choose_tokens: number of pool examples added per iteration.
        tokenizer, data_collator, compute_metrics, SEED: forwarded to
            ``train_and_predict``.

    Returns:
        ``(all_metrics, trainer)``: ``all_metrics`` maps the iteration number (as
        a string) to ``{'train_size': ..., 'metrics': ...}``; ``trainer`` is the
        trainer of the last iteration, or ``None`` when ``al_iters`` is 0.
    """
    full_train = dataset['train']

    def unlabeled_pool(labeled):
        # Materialise the labelled ids once; reading the column inside the
        # predicate would repeat that work for every row of the split.
        labeled_ids = set(labeled['id'])
        return full_train.filter(lambda s: s['id'] not in labeled_ids)

    train_dataset = full_train.select(
        random.sample(
            range(full_train.num_rows),
            int(full_train.num_rows * init_train_size)
        )
    )
    test_dataset = unlabeled_pool(train_dataset)
    all_metrics = {}
    trainer = None  # keeps the return statement valid when al_iters == 0

    for iteration in range(al_iters):
        train_size = train_dataset.num_rows
        print(f'\nIteration: {iteration}. Training using {train_size} samples')
        # Every iteration starts from the pretrained checkpoint, not from the previous model
        model = AutoModelForTokenClassification.from_pretrained(
            config.checkpoint, num_labels=config.n_labels,
            id2label=id_to_tag, label2id=tag_to_id
        )

        metrics, test_predictions, trainer = train_and_predict(
            train_dataset, dataset['valid'], test_dataset, dataset['test'],
            model, tokenizer, data_collator, compute_metrics, SEED
        )

        all_metrics[f'{iteration}'] = {'train_size': train_size, 'metrics': metrics}

        # The pool is only sampled while it still holds at least `choose_tokens` examples
        if test_dataset.num_rows >= choose_tokens:
            assert test_predictions is not None, "test_predictions is None, must be array"
            new_args = choose_samples_random(test_predictions, choose_tokens)
            new_train_samples = test_dataset.select(new_args)
            train_dataset = concatenate_datasets(
                [train_dataset, new_train_samples]
            )
            test_dataset = unlabeled_pool(train_dataset)

    return all_metrics, trainer

# Сэмплирование по 4 примера (по ~0.7% данных, 30 итераций активного обучения) для каждого сида (4 цикла).

In [None]:
# One complete active-learning run per seed; the metrics of each run go to their own JSON file.
for SEED in map(int, seed_lst):  # built-in ints: NumPy scalars are not accepted everywhere downstream
    metrics_path = f'/content/drive/MyDrive/data/VKR/metrics_30_random_seed{SEED}.json'
    # Create the output folder before training so that a missing directory cannot
    # discard the results of a finished run. Google Drive still has to be mounted
    # beforehand for the file to be persisted there.
    os.makedirs(os.path.dirname(metrics_path), exist_ok=True)

    fix_seed(SEED)
    run = wandb.init(
        project="ner_bert_nerel_bio",
        name=config.run_name + f'{SEED}',
        reinit=True)
    metrics, trainer = run_active_learning(
        dataset=tokenized_dataset,
        al_iters=30,
        init_train_size=0.007,
        choose_tokens=4,
        tokenizer=tokenizer,
        data_collator=data_collator,
        compute_metrics=compute_metrics,
        SEED=SEED
    )
    # `finish` replaces the deprecated `join` alias
    run.finish()
    with open(metrics_path, 'w') as file:
        json.dump(metrics, file)

[34m[1mwandb[0m: Currently logged in as: [33mtaoea[0m. Use [1m`wandb login --relogin`[0m to force relogin


Current seed:  517


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 0. Training using 4 samples


config.json:   0%|          | 0.00/889 [00:00<?, ?B/s]

pytorch_model.bin:   0%|          | 0.00/714M [00:00<?, ?B/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.847057,0.01114,0.013837,0.012343,0.02735
2,No log,3.642503,0.035247,0.008208,0.013316,0.158974
3,No log,3.487499,0.014493,0.000469,0.000909,0.156177
4,No log,3.388926,0.022472,0.000469,0.000919,0.1554
5,No log,3.318139,0.023529,0.000469,0.00092,0.1554
6,No log,3.258257,0.022989,0.000469,0.000919,0.155556
7,No log,3.207805,0.021053,0.000469,0.000918,0.156333
8,No log,3.175283,0.044643,0.001173,0.002285,0.158042
9,No log,3.159549,0.047619,0.001407,0.002733,0.159596
10,No log,3.155416,0.053846,0.001642,0.003186,0.160218


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 1. Training using 8 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.782848,0.02034,0.025797,0.022746,0.048796
2,No log,3.352875,0.02454,0.001876,0.003486,0.157265
3,No log,3.176967,0.0,0.0,0.0,0.155245
4,No log,3.072405,0.159817,0.008208,0.015615,0.168765
5,No log,2.955209,0.215078,0.022749,0.041145,0.189433
6,No log,2.864684,0.224599,0.02955,0.052228,0.199223
7,No log,2.800239,0.266753,0.048546,0.082143,0.219736
8,2.647800,2.762798,0.258847,0.060038,0.097468,0.236053
9,2.647800,2.746274,0.258427,0.064728,0.103526,0.242735
10,2.647800,2.742603,0.260949,0.067073,0.106716,0.2446


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 2. Training using 12 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.58935,0.038678,0.022514,0.028461,0.148252
2,No log,3.148695,0.0,0.0,0.0,0.155089
3,No log,2.973859,0.028926,0.001642,0.003107,0.160995
4,No log,2.804702,0.150188,0.028143,0.047403,0.206527
5,No log,2.676631,0.290323,0.118199,0.168,0.305828
6,2.760400,2.557781,0.346695,0.190666,0.246028,0.375447
7,2.760400,2.474317,0.335309,0.212242,0.259945,0.40202
8,2.760400,2.421908,0.333217,0.223734,0.267714,0.411655
9,2.760400,2.398966,0.335182,0.226782,0.270527,0.414297
10,2.760400,2.394396,0.336097,0.228189,0.271826,0.415229


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 3. Training using 16 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.468934,0.022277,0.006332,0.009861,0.158042
2,No log,3.072157,0.0,0.0,0.0,0.154934
3,No log,2.81212,0.159459,0.013837,0.025464,0.186169
4,2.932100,2.628561,0.259813,0.130394,0.173641,0.334266
5,2.932100,2.457335,0.300938,0.188086,0.231491,0.400466
6,2.932100,2.30987,0.336845,0.254925,0.290215,0.464491
7,2.932100,2.206501,0.365165,0.300422,0.329645,0.497591
8,1.734600,2.146545,0.376787,0.315197,0.343251,0.507692
9,1.734600,2.118655,0.381032,0.320356,0.34807,0.511577
10,1.734600,2.113736,0.381019,0.32106,0.348479,0.512665


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 4. Training using 20 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.341808,0.056397,0.015713,0.024578,0.169231
2,No log,2.942909,0.017094,0.000469,0.000913,0.156488
3,No log,2.651347,0.28576,0.210366,0.242334,0.397047
4,2.958300,2.378269,0.353205,0.258443,0.298483,0.45237
5,2.958300,2.124806,0.403164,0.346623,0.372762,0.53007
6,2.958300,1.95398,0.443611,0.388368,0.414155,0.55913
7,1.670100,1.854391,0.469753,0.418856,0.442847,0.575758
8,1.670100,1.804808,0.476665,0.42636,0.450111,0.583372
9,1.670100,1.784813,0.479802,0.431754,0.454512,0.587723
10,1.099800,1.78063,0.481771,0.433865,0.456565,0.588656


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 5. Training using 24 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.294162,0.019753,0.001876,0.003427,0.158664
2,No log,2.88755,0.03012,0.001173,0.002257,0.161305
3,3.034500,2.603985,0.317977,0.148921,0.202843,0.33784
4,3.034500,2.320274,0.326744,0.197702,0.246347,0.396115
5,3.034500,2.038206,0.389934,0.330675,0.357868,0.522611
6,1.823600,1.852851,0.459488,0.408302,0.432385,0.575758
7,1.823600,1.7339,0.489472,0.441604,0.464308,0.599845
8,1.128600,1.668547,0.499872,0.459428,0.478798,0.611655
9,1.128600,1.644398,0.506397,0.464118,0.484337,0.615385
10,1.128600,1.640282,0.510382,0.466932,0.487691,0.616939


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 6. Training using 28 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.16202,0.023729,0.003283,0.005768,0.160684
2,No log,2.690516,0.293358,0.111867,0.161969,0.303497
3,3.020300,2.281881,0.381807,0.29925,0.335525,0.50303
4,3.020300,1.890781,0.46265,0.397983,0.427887,0.578244
5,1.686500,1.683195,0.50824,0.448405,0.476452,0.610101
6,1.686500,1.557358,0.543682,0.490385,0.51566,0.641492
7,1.012300,1.494127,0.567694,0.514306,0.539683,0.654701
8,1.012300,1.472706,0.575859,0.52697,0.550331,0.662782
9,1.012300,1.46041,0.58136,0.535413,0.557441,0.666667
10,0.764600,1.4581,0.582272,0.536116,0.558242,0.667444


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 7. Training using 32 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.132885,0.0,0.0,0.0,0.155089
2,3.114500,2.636461,0.342231,0.201454,0.253617,0.397669
3,3.114500,2.10315,0.420561,0.316604,0.361252,0.513908
4,1.735300,1.735245,0.512807,0.44137,0.474414,0.6115
5,1.735300,1.574699,0.545337,0.495075,0.518992,0.640093
6,0.994000,1.463997,0.584389,0.530253,0.556006,0.666822
7,0.994000,1.36997,0.598798,0.560741,0.579145,0.684382
8,0.719600,1.352566,0.599801,0.565197,0.581985,0.688578
9,0.719600,1.342158,0.599154,0.564728,0.581432,0.68951
10,0.611600,1.33909,0.60005,0.566135,0.582599,0.689977


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 8. Training using 36 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.102728,0.016129,0.000469,0.000912,0.156799
2,3.184500,2.63434,0.299024,0.172373,0.218685,0.379798
3,3.184500,2.095098,0.395743,0.322702,0.35551,0.531469
4,1.955100,1.710419,0.513989,0.452392,0.481227,0.612743
5,1.955100,1.513651,0.557784,0.495779,0.524957,0.648174
6,1.161100,1.388609,0.608994,0.562148,0.584634,0.690754
7,1.161100,1.31057,0.628114,0.579503,0.60283,0.703341
8,0.770500,1.270114,0.637582,0.591229,0.613531,0.709713
9,0.612900,1.258018,0.640121,0.595685,0.617104,0.714375
10,0.612900,1.256081,0.641381,0.596857,0.618319,0.714841


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 9. Training using 40 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.104635,0.008621,0.000235,0.000457,0.155089
2,3.216100,2.50625,0.327262,0.252814,0.285261,0.446154
3,3.216100,1.93394,0.418956,0.357645,0.385881,0.554157
4,1.958900,1.578256,0.551938,0.500938,0.525203,0.647086
5,1.102500,1.386964,0.594574,0.549953,0.571394,0.680963
6,1.102500,1.269899,0.632071,0.587008,0.608706,0.711577
7,0.741100,1.204183,0.649233,0.605535,0.626623,0.728205
8,0.551300,1.167876,0.666165,0.623358,0.644051,0.739705
9,0.551300,1.159515,0.668667,0.627111,0.647223,0.741103
10,0.486900,1.158473,0.669835,0.628049,0.648269,0.74157


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 10. Training using 44 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.056336,0.0,0.0,0.0,0.154934
2,3.213100,2.445605,0.350598,0.227017,0.275587,0.427972
3,1.994200,1.806921,0.465029,0.408537,0.434956,0.58648
4,1.994200,1.454305,0.576241,0.525563,0.549736,0.66418
5,1.127900,1.29497,0.624283,0.587242,0.605196,0.708003
6,0.695300,1.212522,0.651063,0.603424,0.626339,0.725253
7,0.695300,1.12398,0.672827,0.631801,0.651669,0.742036
8,0.574500,1.115476,0.675926,0.633443,0.653995,0.746698
9,0.439900,1.098684,0.676404,0.635319,0.655218,0.748718
10,0.439900,1.095289,0.678161,0.636492,0.656666,0.749495


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 11. Training using 48 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.030327,0.009174,0.000235,0.000457,0.15711
2,3.292800,2.282311,0.410498,0.326454,0.363684,0.50272
3,1.958600,1.638862,0.552537,0.505629,0.528043,0.644755
4,1.205200,1.385962,0.592565,0.560741,0.576214,0.678011
5,1.205200,1.23927,0.646269,0.609287,0.627233,0.719658
6,0.804900,1.116303,0.681516,0.64939,0.665065,0.751204
7,0.554900,1.069541,0.68704,0.656426,0.671384,0.758197
8,0.460400,1.063169,0.698118,0.661116,0.679113,0.764413
9,0.460400,1.04822,0.695107,0.662992,0.67867,0.765967
10,0.415800,1.045321,0.696798,0.663462,0.679721,0.7669


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 12. Training using 52 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.039573,0.0,0.0,0.0,0.154934
2,3.291100,2.254863,0.363171,0.266417,0.307359,0.4662
3,2.124300,1.621827,0.552801,0.502111,0.526238,0.649883
4,1.271300,1.312001,0.61752,0.568715,0.592113,0.697591
5,0.795500,1.15077,0.66525,0.624062,0.643998,0.739083
6,0.795500,1.070769,0.680729,0.63954,0.659492,0.751515
7,0.593500,1.01775,0.701776,0.657833,0.679095,0.76892
8,0.430500,1.002991,0.706206,0.66182,0.683293,0.771873
9,0.407200,0.990454,0.709613,0.66651,0.687387,0.774048
10,0.353500,0.988046,0.706102,0.664869,0.684865,0.773427


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 13. Training using 56 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.005323,0.020979,0.000704,0.001361,0.160528
2,3.374100,2.158986,0.399322,0.303705,0.345011,0.499145
3,2.187500,1.524209,0.570385,0.531191,0.550091,0.659984
4,1.378700,1.253212,0.632455,0.596857,0.614141,0.7108
5,0.842900,1.109809,0.679166,0.641417,0.659752,0.747475
6,0.675600,1.019573,0.69505,0.658537,0.676301,0.760995
7,0.481500,0.956955,0.712061,0.675657,0.693381,0.778866
8,0.413000,0.952424,0.711982,0.673077,0.691983,0.778089
9,0.413000,0.933596,0.720089,0.681754,0.700398,0.783061
10,0.361300,0.93242,0.720209,0.680347,0.699711,0.783061


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 14. Training using 60 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.968897,0.0,0.0,0.0,0.1554
2,3.422100,2.091101,0.39085,0.324578,0.354644,0.528516
3,2.306600,1.480105,0.560394,0.507036,0.532381,0.658897
4,1.371100,1.20857,0.635027,0.597795,0.615849,0.716239
5,0.912000,1.07023,0.671593,0.628752,0.649467,0.742191
6,0.649700,0.985926,0.70804,0.660882,0.683649,0.774981
7,0.535300,0.934468,0.713786,0.670263,0.69134,0.782595
8,0.403900,0.902175,0.724189,0.685976,0.704565,0.793629
9,0.334700,0.909892,0.720803,0.681754,0.700735,0.791142
10,0.277800,0.908951,0.722112,0.683161,0.702097,0.792852


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 15. Training using 64 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3434,2.892499,0.087571,0.00727,0.013426,0.174514
2,2.1947,1.882891,0.495457,0.434803,0.463153,0.601088
3,1.3287,1.398545,0.607348,0.569887,0.588022,0.683916
4,0.9151,1.14433,0.66759,0.621717,0.643837,0.734421
5,0.6495,0.991044,0.714108,0.671904,0.692363,0.773737
6,0.4878,0.939942,0.71199,0.675422,0.693224,0.78042
7,0.3852,0.906471,0.739001,0.70122,0.719615,0.798135
8,0.3291,0.89664,0.732544,0.696295,0.713959,0.796426
9,0.2994,0.886338,0.734417,0.699109,0.716328,0.797203
10,0.2824,0.885894,0.735896,0.700516,0.71777,0.79798


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 16. Training using 68 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3816,2.901709,0.204268,0.031426,0.054472,0.19425
2,2.3066,1.930732,0.446158,0.386726,0.414322,0.554934
3,1.3873,1.363692,0.591847,0.558396,0.574635,0.677389
4,0.9858,1.124938,0.651894,0.617495,0.634229,0.732556
5,0.66,1.008017,0.684313,0.657833,0.670812,0.766434
6,0.4872,0.921544,0.713473,0.676829,0.694668,0.777778
7,0.4138,0.899689,0.714147,0.687852,0.700753,0.790054
8,0.328,0.876687,0.725964,0.697702,0.711552,0.796426
9,0.3142,0.873846,0.722777,0.695826,0.709045,0.79627
10,0.2577,0.874865,0.721559,0.694653,0.70785,0.795493


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 17. Training using 72 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3954,2.825629,0.227751,0.07622,0.114215,0.273504
2,2.2799,1.752921,0.51887,0.461069,0.488265,0.625175
3,1.342,1.332281,0.60731,0.576689,0.591604,0.690598
4,0.9015,1.094951,0.68824,0.640947,0.663752,0.747164
5,0.7472,1.010528,0.705096,0.655488,0.679387,0.770785
6,0.4452,0.910672,0.722426,0.692777,0.707291,0.791608
7,0.3773,0.898852,0.721965,0.69606,0.708776,0.795183
8,0.277,0.869968,0.736039,0.701689,0.718454,0.799534
9,0.2481,0.859082,0.738822,0.709193,0.723705,0.802953
10,0.2486,0.858831,0.73827,0.70849,0.723073,0.802176


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 18. Training using 76 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3637,2.819603,0.157667,0.01712,0.030886,0.193007
2,2.3103,1.714518,0.497245,0.444418,0.46935,0.608392
3,1.4081,1.240373,0.642314,0.593809,0.617109,0.712199
4,0.9976,1.031483,0.710513,0.662523,0.68568,0.767366
5,0.6444,0.9216,0.726727,0.681051,0.703148,0.787413
6,0.4059,0.872186,0.738636,0.70122,0.719442,0.797824
7,0.3044,0.854234,0.737438,0.702158,0.719366,0.802642
8,0.3018,0.852036,0.739438,0.710131,0.724489,0.803263
9,0.2501,0.855099,0.741589,0.713415,0.727229,0.805284
10,0.2306,0.852619,0.742439,0.713884,0.727881,0.80575


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 19. Training using 80 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4936,2.734855,0.282496,0.076454,0.12034,0.270396
2,2.3439,1.702639,0.531034,0.469512,0.498382,0.630148
3,1.4612,1.203621,0.647222,0.601079,0.623298,0.721678
4,0.6985,1.04482,0.691007,0.661351,0.675854,0.764413
5,0.5225,0.910502,0.719768,0.699343,0.709409,0.79223
6,0.4134,0.858755,0.723585,0.69864,0.710894,0.79596
7,0.3262,0.850196,0.730405,0.70591,0.717949,0.802176
8,0.2298,0.841361,0.734055,0.715291,0.724552,0.807615
9,0.2078,0.841578,0.734748,0.714587,0.724527,0.808547
10,0.2263,0.841177,0.734605,0.713415,0.723855,0.807615


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 20. Training using 84 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4383,2.767942,0.286554,0.102955,0.151484,0.279876
2,2.3818,1.658118,0.521739,0.469981,0.49451,0.625175
3,1.5358,1.206634,0.639737,0.594278,0.61617,0.712821
4,0.7167,0.984499,0.699677,0.659475,0.678981,0.764413
5,0.5003,0.882624,0.731111,0.694418,0.712293,0.794872
6,0.4167,0.827959,0.737506,0.712946,0.725018,0.806993
7,0.2578,0.845887,0.73999,0.710835,0.72512,0.805284
8,0.2435,0.824228,0.747881,0.724203,0.735851,0.816006
9,0.2076,0.816212,0.750851,0.724437,0.737407,0.816783
10,0.1914,0.817823,0.753899,0.72561,0.739484,0.817249


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 21. Training using 88 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4758,2.661307,0.245768,0.170263,0.201164,0.363481
2,2.388,1.57867,0.568748,0.518996,0.542735,0.655167
3,1.04,1.202629,0.636364,0.602486,0.618962,0.715152
4,0.7726,1.000449,0.693923,0.658771,0.67589,0.766278
5,0.5354,0.883273,0.72955,0.696529,0.712657,0.795338
6,0.3353,0.852917,0.727074,0.702861,0.714763,0.800466
7,0.2561,0.830436,0.740561,0.717636,0.728919,0.808858
8,0.2054,0.820177,0.738543,0.718105,0.728181,0.812898
9,0.2119,0.811293,0.747055,0.728659,0.737742,0.817716
10,0.1863,0.813194,0.746276,0.728424,0.737242,0.818182


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 22. Training using 92 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3995,2.668815,0.325593,0.147983,0.203483,0.35136
2,2.4529,1.559778,0.561164,0.511023,0.534921,0.656255
3,1.0354,1.145998,0.66716,0.633677,0.649988,0.738462
4,0.8031,0.98213,0.707093,0.668621,0.687319,0.775758
5,0.4527,0.893852,0.726027,0.69606,0.710728,0.792541
6,0.3612,0.808722,0.737352,0.714353,0.72567,0.809013
7,0.2669,0.82953,0.738284,0.72045,0.729258,0.813209
8,0.2139,0.822946,0.740688,0.727486,0.734027,0.814763
9,0.1812,0.816306,0.742229,0.727955,0.735022,0.816472
10,0.189,0.816866,0.74324,0.728424,0.735757,0.816783


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 23. Training using 96 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5021,2.663968,0.372134,0.148452,0.212238,0.332246
2,1.6892,1.573555,0.563333,0.515244,0.538217,0.655322
3,1.0543,1.174107,0.639147,0.597326,0.617529,0.717949
4,0.6012,0.972367,0.705393,0.656426,0.680029,0.768765
5,0.4693,0.889079,0.727009,0.704503,0.715579,0.798446
6,0.2891,0.820232,0.742061,0.717871,0.729765,0.812743
7,0.2612,0.814991,0.748418,0.721388,0.734655,0.815851
8,0.1948,0.822347,0.747404,0.725844,0.736466,0.818493
9,0.1751,0.803499,0.748796,0.729128,0.738831,0.821445
10,0.168,0.805661,0.749759,0.729362,0.73942,0.821445


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 24. Training using 100 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4324,2.664326,0.301897,0.126876,0.178666,0.317016
2,1.675,1.565963,0.561064,0.509615,0.534103,0.653302
3,1.1038,1.144208,0.671086,0.617261,0.643049,0.739394
4,0.6295,0.958511,0.706837,0.674015,0.690036,0.777312
5,0.4711,0.870548,0.724071,0.699109,0.711371,0.800155
6,0.3103,0.821651,0.743633,0.719043,0.731132,0.810723
7,0.2763,0.820097,0.73888,0.720685,0.729669,0.81181
8,0.165,0.817331,0.750182,0.726079,0.737934,0.818648
9,0.1734,0.813495,0.749819,0.728893,0.739208,0.820047
10,0.1529,0.815797,0.748491,0.727251,0.737719,0.819114


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 25. Training using 104 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5194,2.581735,0.319459,0.215994,0.257731,0.411655
2,1.6771,1.456416,0.573031,0.539165,0.555582,0.665579
3,0.9914,1.063991,0.703335,0.662758,0.682444,0.763792
4,0.6287,0.944885,0.717322,0.688555,0.702644,0.787257
5,0.3488,0.811816,0.744764,0.717167,0.730705,0.80979
6,0.3161,0.790165,0.749642,0.735929,0.742722,0.817871
7,0.2309,0.788007,0.756401,0.741323,0.748786,0.82331
8,0.1788,0.753125,0.771456,0.756801,0.764058,0.832168
9,0.1719,0.763092,0.767009,0.753518,0.760203,0.83108
10,0.16,0.761772,0.768881,0.754456,0.7616,0.831857


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 26. Training using 108 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5359,2.471547,0.332319,0.204972,0.253554,0.402176
2,1.5972,1.416008,0.594534,0.556051,0.574649,0.681896
3,0.8438,1.095623,0.680936,0.641651,0.66071,0.746232
4,0.6415,0.948394,0.706703,0.677533,0.69181,0.780886
5,0.4252,0.849157,0.736536,0.712008,0.724064,0.804351
6,0.2986,0.803758,0.74825,0.727017,0.737481,0.81756
7,0.23,0.80559,0.750483,0.729362,0.739772,0.817405
8,0.1924,0.795624,0.744292,0.726313,0.735193,0.817716
9,0.1459,0.796458,0.753378,0.732176,0.742626,0.821911
10,0.1535,0.798008,0.752411,0.731942,0.742035,0.821756


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 27. Training using 112 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.559,2.460132,0.351019,0.234287,0.281013,0.427195
2,1.6409,1.354211,0.615917,0.584428,0.599759,0.693085
3,0.8101,1.050907,0.69703,0.660413,0.678227,0.771251
4,0.5534,0.874094,0.734242,0.707552,0.72065,0.79798
5,0.3637,0.846495,0.725072,0.709428,0.717165,0.806216
6,0.2687,0.764811,0.743486,0.729362,0.736356,0.818493
7,0.1836,0.769251,0.74552,0.731707,0.738549,0.823155
8,0.16,0.766951,0.75521,0.739447,0.747245,0.826884
9,0.1549,0.759436,0.752801,0.740619,0.74666,0.828283
10,0.1222,0.759204,0.753513,0.742026,0.747725,0.829215


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 28. Training using 116 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5553,2.430507,0.332401,0.278612,0.303139,0.47195
2,1.5104,1.312694,0.633209,0.599203,0.615737,0.712044
3,0.7967,1.039156,0.694949,0.655019,0.674393,0.759285
4,0.4969,0.876609,0.72264,0.698405,0.710316,0.794561
5,0.3376,0.805504,0.742091,0.720685,0.731231,0.808702
6,0.2728,0.767986,0.751257,0.735929,0.743514,0.81958
7,0.1974,0.770368,0.759259,0.740385,0.749703,0.825019
8,0.1711,0.756675,0.761574,0.744606,0.752994,0.829681
9,0.1587,0.757023,0.761735,0.749765,0.755703,0.830614
10,0.1426,0.757186,0.762154,0.75,0.756028,0.830458


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 29. Training using 120 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5006,2.352053,0.318243,0.220919,0.260797,0.428283
2,1.5789,1.338104,0.595875,0.569184,0.582224,0.678943
3,0.8636,0.998183,0.712846,0.663696,0.687394,0.760528
4,0.5332,0.861075,0.736932,0.710835,0.723648,0.803263
5,0.3715,0.793314,0.747333,0.722795,0.734859,0.813986
6,0.2757,0.75147,0.753392,0.742261,0.747785,0.823155
7,0.1748,0.774861,0.753647,0.738977,0.74624,0.822067
8,0.1591,0.754443,0.763919,0.749765,0.756776,0.828749
9,0.129,0.767599,0.763849,0.750235,0.756981,0.829526
10,0.1318,0.768183,0.762599,0.748827,0.75565,0.828749


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]



VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▂▁▃▄▂▅▆▅▃▇▇▆▂▄▇▇▇▂█▇▇██▇▆████▆███▄██▇███
eval/f1,▁▁▂▃▁▄▅▄▂▆▆▅▁▄▇▇▆▁▇▇▆██▇▅████▆██▇▃██▇███
eval/loss,▇█▆▅▆▄▃▄▅▃▂▃▆▅▂▂▂▆▁▂▂▁▁▂▃▁▁▁▁▃▁▁▁▅▁▁▂▁▁▁
eval/precision,▁▁▃▄▂▄▅▅▄▆▆▆▁▄▇▇▇▁█▇▇██▇▆████▆██▇▄██▇███
eval/recall,▁▁▂▃▁▄▅▄▂▆▆▅▁▃▇▇▆▁▇▇▆█▇▇▅███▇▆██▇▃██▇███
eval/runtime,▄▂▁▁▂▂▇▂▁▂▂▁▆▂▇▇▇▃▁▁▇▂▂▂▂▂▂▂▂▂▂█▂▂▂▂▂▁▂▂
eval/samples_per_second,▄▇█▇▇▇▂▇█▇▇▇▃▇▂▂▁▆▇█▂▇▇▇▇▇▇▇▇▇▇▁▇▇▇▇▇▇▇▆
eval/steps_per_second,▄▇█▇▇▇▂▇█▇▇▇▃▇▂▂▁▆▇█▂▇▇▇▇▇▇▇▇▇▇▁▇▇▇▇▇▇▇▆
train/epoch,▆█▂▃▃▄▃▃▃▁█▇▆▄▃█▆▄▂█▅▃█▅▂▇▄▁▆▃▇▄█▅▂▆▂▇▃▇
train/global_step,▁▁▁▁▁▂▂▂▂▁▄▄▃▃▂▅▄▃▂▅▄▂▆▄▂▆▄▁▅▃▇▄█▅▂▆▃▇▃█

0,1
eval/accuracy,0.82875
eval/f1,0.75565
eval/loss,0.76818
eval/precision,0.7626
eval/recall,0.74883
eval/runtime,1.124
eval/samples_per_second,68.503
eval/steps_per_second,17.793
train/epoch,10.0
train/global_step,300.0


Current seed:  1063


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 0. Training using 4 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.816309,0.013294,0.016886,0.014876,0.02331
2,No log,3.56267,0.052768,0.047608,0.050055,0.153846
3,No log,3.350509,0.068852,0.02955,0.041352,0.192696
4,No log,3.205517,0.094703,0.027674,0.042831,0.193473
5,No log,3.121142,0.115806,0.034709,0.05341,0.200622
6,No log,3.070256,0.12987,0.044559,0.066352,0.214608
7,No log,3.039236,0.132959,0.049953,0.072622,0.222844
8,No log,3.022436,0.142183,0.05652,0.080886,0.230769
9,No log,3.014938,0.148469,0.060272,0.085738,0.233722
10,No log,3.012997,0.151376,0.061914,0.087883,0.235431


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 1. Training using 8 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.75552,0.017956,0.022045,0.019792,0.034343
2,No log,3.315722,0.027752,0.013837,0.018466,0.150738
3,No log,3.121161,0.049525,0.023218,0.031614,0.171873
4,No log,2.998981,0.060922,0.026032,0.036477,0.182595
5,No log,2.912149,0.126578,0.084662,0.101461,0.243823
6,No log,2.849226,0.165347,0.12242,0.140682,0.287335
7,No log,2.803212,0.193087,0.15197,0.170079,0.319503
8,2.806600,2.773289,0.212926,0.173077,0.190944,0.340637
9,2.806600,2.758312,0.219009,0.179409,0.197241,0.34763
10,2.806600,2.754942,0.219233,0.179644,0.197474,0.348718


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 2. Training using 12 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.572578,0.053753,0.050891,0.052283,0.154779
2,No log,3.074534,0.103636,0.013368,0.023681,0.175602
3,No log,2.886515,0.169607,0.069887,0.098987,0.23683
4,No log,2.718964,0.272013,0.154315,0.196918,0.30878
5,No log,2.567876,0.311452,0.204737,0.247064,0.363326
6,2.815500,2.438594,0.341667,0.25,0.288732,0.410878
7,2.815500,2.344649,0.359736,0.281191,0.315651,0.441181
8,2.815500,2.290304,0.3625,0.292448,0.323728,0.453924
9,2.815500,2.26696,0.366028,0.300188,0.329854,0.460451
10,2.815500,2.262608,0.365708,0.301126,0.330289,0.461383


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 3. Training using 16 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.54571,0.073572,0.066135,0.069655,0.18648
2,No log,3.035805,0.113036,0.06121,0.079416,0.235587
3,No log,2.787884,0.253858,0.154315,0.191949,0.318104
4,2.928300,2.513961,0.322682,0.241557,0.276288,0.415695
5,2.928300,2.29555,0.365061,0.295028,0.326329,0.469775
6,2.928300,2.132999,0.38943,0.32833,0.356279,0.498834
7,2.928300,2.029974,0.422161,0.361867,0.389696,0.524165
8,1.540900,1.972203,0.42942,0.373124,0.399297,0.539549
9,1.540900,1.948359,0.438578,0.381801,0.408225,0.547941
10,1.540900,1.944197,0.440463,0.383443,0.40998,0.549184


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 4. Training using 20 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.363637,0.102041,0.072702,0.084908,0.222222
2,No log,2.939793,0.212766,0.04925,0.079985,0.215851
3,No log,2.664832,0.267691,0.19606,0.226344,0.367211
4,3.007800,2.346626,0.33789,0.266651,0.298073,0.447552
5,3.007800,2.084866,0.407336,0.348968,0.3759,0.532712
6,3.007800,1.906225,0.466421,0.415338,0.4394,0.586946
7,1.650700,1.808294,0.494626,0.442542,0.467137,0.606527
8,1.650700,1.756418,0.506273,0.454268,0.478863,0.616472
9,1.650700,1.732279,0.514173,0.459428,0.485261,0.62129
10,1.094100,1.728579,0.516299,0.4606,0.486862,0.621445


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 5. Training using 24 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.276612,0.074126,0.04925,0.05918,0.191764
2,No log,2.916049,0.077075,0.009146,0.016352,0.173582
3,3.059400,2.575372,0.311286,0.240619,0.271429,0.419736
4,3.059400,2.221738,0.374496,0.326454,0.348828,0.488112
5,3.059400,1.956191,0.426622,0.388602,0.406726,0.550117
6,1.801100,1.794051,0.490665,0.462242,0.476029,0.601865
7,1.801100,1.697153,0.519941,0.492261,0.505722,0.623465
8,1.082100,1.652066,0.524982,0.500235,0.512309,0.633877
9,1.082100,1.630883,0.533284,0.50727,0.519952,0.638695
10,1.082100,1.626836,0.535485,0.509615,0.52223,0.639782


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 6. Training using 28 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.132988,0.032895,0.002345,0.004378,0.159596
2,No log,2.757376,0.193548,0.119606,0.147848,0.295726
3,3.093800,2.369639,0.361886,0.26454,0.30565,0.449883
4,3.093800,1.909897,0.481183,0.434803,0.456819,0.59798
5,1.799500,1.642084,0.544199,0.508208,0.525588,0.643823
6,1.799500,1.522015,0.573149,0.535647,0.553764,0.668531
7,0.966900,1.43507,0.604571,0.576923,0.590424,0.691686
8,0.966900,1.410071,0.604121,0.577627,0.590577,0.692929
9,0.966900,1.405542,0.600294,0.574109,0.58691,0.692308
10,0.693100,1.402885,0.600147,0.574109,0.586839,0.692463


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 7. Training using 32 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.233981,0.074468,0.022983,0.035125,0.177933
2,3.191000,2.678195,0.300566,0.236632,0.264795,0.406061
3,3.191000,2.144897,0.438443,0.375,0.404247,0.547164
4,1.777500,1.734509,0.535315,0.494137,0.513902,0.631702
5,1.777500,1.543184,0.572816,0.539634,0.55573,0.666977
6,0.951700,1.432062,0.598481,0.572936,0.58543,0.690132
7,0.951700,1.367919,0.615329,0.594981,0.604984,0.704274
8,0.638000,1.343125,0.618886,0.599437,0.609006,0.707071
9,0.638000,1.334261,0.619715,0.601548,0.610496,0.708003
10,0.544300,1.332993,0.619773,0.601313,0.610404,0.708003


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 8. Training using 36 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.046621,0.007042,0.000235,0.000454,0.155556
2,3.151300,2.602933,0.311571,0.226079,0.262028,0.400622
3,3.151300,2.022917,0.44835,0.391886,0.41822,0.562549
4,1.839400,1.672334,0.544736,0.516886,0.530445,0.645688
5,1.839400,1.493343,0.585871,0.564024,0.57474,0.676457
6,1.050800,1.385647,0.601689,0.584897,0.593174,0.69526
7,1.050800,1.326943,0.623884,0.606473,0.615055,0.711577
8,0.672000,1.307951,0.625634,0.60788,0.616629,0.711733
9,0.528100,1.305784,0.624668,0.606942,0.615677,0.712044
10,0.528100,1.302304,0.626967,0.607411,0.617034,0.713131


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 9. Training using 40 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.093491,0.0,0.0,0.0,0.154934
2,3.210700,2.545522,0.295209,0.25,0.27073,0.440093
3,3.210700,1.901938,0.472081,0.4144,0.441364,0.583994
4,1.968300,1.53626,0.575288,0.5394,0.556766,0.674281
5,1.050800,1.385252,0.599901,0.568246,0.583644,0.691531
6,1.050800,1.317835,0.614189,0.592871,0.603341,0.705517
7,0.711000,1.269173,0.616639,0.603189,0.60984,0.713442
8,0.535300,1.241238,0.627066,0.613977,0.620453,0.720901
9,0.535300,1.237859,0.631033,0.613274,0.622027,0.720746
10,0.467300,1.236378,0.630147,0.613743,0.621837,0.720901


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 10. Training using 44 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.037817,0.092486,0.011257,0.020071,0.165812
2,3.259800,2.524734,0.356809,0.215056,0.268364,0.383528
3,2.133700,1.816431,0.505835,0.467636,0.485986,0.618493
4,2.133700,1.503741,0.58854,0.558865,0.573319,0.6777
5,1.141100,1.329384,0.621508,0.589587,0.605127,0.704429
6,0.771200,1.25271,0.635455,0.611163,0.623072,0.713442
7,0.771200,1.167716,0.645045,0.627345,0.636072,0.732246
8,0.537300,1.157528,0.649915,0.630863,0.640248,0.735043
9,0.493600,1.149784,0.652953,0.632739,0.642687,0.736131
10,0.493600,1.148626,0.654479,0.633912,0.644031,0.737529


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 11. Training using 48 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.983315,0.049618,0.003049,0.005745,0.161461
2,3.275200,2.184538,0.434104,0.365385,0.396791,0.556488
3,1.984900,1.60838,0.570842,0.521576,0.545098,0.663248
4,1.152900,1.320266,0.629222,0.589822,0.608885,0.706915
5,1.152900,1.160369,0.668293,0.642589,0.655189,0.746698
6,0.691500,1.085155,0.679619,0.652205,0.665629,0.761927
7,0.523900,1.05284,0.697983,0.665572,0.681393,0.776068
8,0.419800,1.036075,0.696242,0.673546,0.684706,0.779176
9,0.419800,1.023976,0.697146,0.675891,0.686354,0.779953
10,0.361600,1.023131,0.697241,0.675657,0.686279,0.779953


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 12. Training using 52 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.960841,0.104677,0.033068,0.050258,0.21352
2,3.277500,2.115458,0.389169,0.325281,0.354369,0.517172
3,2.050000,1.575662,0.569815,0.520638,0.544118,0.65812
4,1.220800,1.291389,0.637346,0.608349,0.62251,0.718881
5,0.834200,1.166013,0.65825,0.62969,0.643653,0.733023
6,0.834200,1.071235,0.675524,0.649859,0.662443,0.751204
7,0.540400,1.041485,0.677712,0.666745,0.672183,0.756022
8,0.445900,1.006558,0.680876,0.670497,0.675647,0.765967
9,0.345500,0.998406,0.686845,0.675891,0.681324,0.770319
10,0.349700,0.998278,0.685578,0.674484,0.679986,0.769852


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 13. Training using 56 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.001705,0.142105,0.018996,0.033513,0.184149
2,3.311900,2.221947,0.369709,0.301126,0.331912,0.498368
3,2.242600,1.601846,0.548895,0.506801,0.527009,0.646309
4,1.350900,1.318837,0.624265,0.597326,0.610499,0.711267
5,0.878300,1.172425,0.656053,0.632974,0.644307,0.734887
6,0.552800,1.122591,0.663059,0.646576,0.654714,0.742347
7,0.447200,1.06578,0.67148,0.654315,0.662787,0.751981
8,0.360400,1.048305,0.684388,0.667214,0.675692,0.761772
9,0.360400,1.03438,0.688309,0.67378,0.680967,0.766589
10,0.312900,1.034472,0.689118,0.67425,0.681603,0.766589


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 14. Training using 60 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.96999,0.021978,0.000469,0.000918,0.155245
2,3.327300,2.009984,0.432987,0.351548,0.38804,0.540171
3,2.159100,1.454909,0.587756,0.558396,0.5727,0.679876
4,1.265400,1.241304,0.63874,0.613274,0.625748,0.722145
5,0.804500,1.102501,0.663178,0.639071,0.650902,0.741259
6,0.577300,1.013422,0.682124,0.665807,0.673867,0.765501
7,0.412600,0.995864,0.691863,0.674015,0.682823,0.772028
8,0.340200,0.968711,0.705235,0.691839,0.698473,0.784149
9,0.305700,0.964333,0.706485,0.694887,0.700638,0.786169
10,0.260400,0.965072,0.706962,0.695356,0.701111,0.786169


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 15. Training using 64 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3306,2.879388,0.332072,0.082317,0.13193,0.239782
2,2.1743,1.887648,0.470925,0.40455,0.435221,0.581818
3,1.2749,1.442422,0.585821,0.552298,0.568566,0.671639
4,0.8507,1.149189,0.64495,0.624531,0.634576,0.732246
5,0.6073,1.036277,0.669301,0.655488,0.662322,0.757887
6,0.4476,0.976612,0.702214,0.691839,0.696988,0.781352
7,0.3462,0.945055,0.701305,0.693246,0.697252,0.785082
8,0.2924,0.929437,0.708225,0.70075,0.704468,0.792075
9,0.261,0.927978,0.709418,0.703096,0.706243,0.791608
10,0.2524,0.927562,0.7073,0.702158,0.704719,0.791142


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 16. Training using 68 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4122,2.941486,0.104762,0.00258,0.005035,0.156954
2,2.4176,2.031295,0.436496,0.394934,0.414676,0.559907
3,1.5549,1.501568,0.56336,0.537992,0.550384,0.659984
4,1.0252,1.263208,0.617605,0.602251,0.609831,0.705206
5,0.7018,1.094773,0.652867,0.643527,0.648163,0.733178
6,0.5038,1.007568,0.674761,0.677767,0.676261,0.76115
7,0.4257,0.970715,0.683462,0.687148,0.6853,0.774514
8,0.349,0.971514,0.683817,0.685741,0.684778,0.777778
9,0.2603,0.962183,0.692542,0.694653,0.693596,0.78244
10,0.2549,0.961013,0.693958,0.697702,0.695825,0.784615


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 17. Training using 72 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3721,2.860738,0.185326,0.091229,0.122269,0.255478
2,2.252,1.73119,0.545906,0.489447,0.516137,0.646309
3,1.3249,1.297803,0.636296,0.599437,0.617317,0.715462
4,0.8249,1.08645,0.673222,0.650328,0.661577,0.748407
5,0.5996,0.996613,0.693443,0.672139,0.682625,0.774359
6,0.4533,0.940068,0.708383,0.695591,0.701929,0.793784
7,0.335,0.928855,0.721092,0.706379,0.71366,0.798912
8,0.2416,0.904769,0.723684,0.709428,0.716485,0.802642
9,0.2013,0.896754,0.722912,0.710366,0.716584,0.804196
10,0.1991,0.89709,0.721163,0.709662,0.715366,0.803419


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 18. Training using 76 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4205,2.829886,0.228234,0.086069,0.125,0.255012
2,2.2209,1.741381,0.512869,0.44864,0.478609,0.612898
3,1.3725,1.290891,0.625783,0.609053,0.617304,0.708003
4,0.9199,1.130435,0.651265,0.628049,0.639446,0.731935
5,0.628,1.018845,0.677258,0.664869,0.671006,0.755711
6,0.3642,0.972429,0.694537,0.685741,0.690111,0.77265
7,0.2909,0.904573,0.715844,0.707786,0.711792,0.796115
8,0.257,0.903599,0.718557,0.710131,0.714319,0.796115
9,0.1859,0.893376,0.727186,0.717636,0.72238,0.800777
10,0.2099,0.892499,0.724858,0.716698,0.720755,0.800622


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 19. Training using 80 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4587,2.835821,0.274194,0.043856,0.075617,0.205128
2,2.4067,1.79911,0.478354,0.419794,0.447165,0.585082
3,1.5434,1.333412,0.603385,0.576923,0.589857,0.692929
4,0.748,1.109908,0.655691,0.644465,0.65003,0.737685
5,0.5247,0.985533,0.674479,0.668152,0.671301,0.76317
6,0.3795,0.936987,0.700214,0.691839,0.696001,0.787879
7,0.306,0.904122,0.719469,0.711538,0.715482,0.800311
8,0.2286,0.903744,0.718327,0.708724,0.713493,0.798601
9,0.2113,0.899934,0.72516,0.717167,0.721141,0.804662
10,0.1762,0.896902,0.726151,0.717636,0.721868,0.804973


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 20. Training using 84 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4374,2.724721,0.261289,0.196764,0.224482,0.383217
2,2.3229,1.57846,0.551581,0.499062,0.524009,0.644289
3,1.3793,1.218429,0.631823,0.608114,0.619742,0.713442
4,0.6732,1.020447,0.689123,0.659709,0.674095,0.758974
5,0.5124,0.933174,0.708682,0.694887,0.701717,0.787413
6,0.4005,0.868526,0.726162,0.710835,0.718417,0.799534
7,0.2577,0.858277,0.735469,0.727017,0.731218,0.807459
8,0.215,0.846953,0.74114,0.725844,0.733412,0.810878
9,0.1768,0.843221,0.741935,0.728189,0.734998,0.812432
10,0.1758,0.84315,0.740865,0.727486,0.734114,0.812432


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 21. Training using 88 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4934,2.766099,0.12044,0.041041,0.061221,0.20202
2,2.4169,1.647696,0.543191,0.491088,0.515827,0.638695
3,0.9785,1.249744,0.620157,0.593105,0.606329,0.708314
4,0.7058,1.028602,0.67123,0.666979,0.669098,0.757576
5,0.5339,0.931717,0.703924,0.694184,0.69902,0.78819
6,0.3321,0.893793,0.723146,0.713649,0.718366,0.798446
7,0.2425,0.870229,0.731852,0.725844,0.728836,0.810567
8,0.1679,0.86198,0.735836,0.731004,0.733412,0.811966
9,0.1831,0.862228,0.738309,0.733114,0.735703,0.81352
10,0.1505,0.862743,0.738483,0.733114,0.735789,0.81352


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 22. Training using 92 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4927,2.633276,0.302983,0.183396,0.228488,0.380264
2,2.3378,1.480932,0.587928,0.527674,0.556174,0.663559
3,0.8783,1.12115,0.651202,0.635319,0.643162,0.733955
4,0.7329,0.975079,0.702455,0.684334,0.693276,0.775291
5,0.3912,0.885765,0.731222,0.714587,0.722809,0.805439
6,0.3173,0.843319,0.742305,0.729597,0.735896,0.816628
7,0.214,0.811948,0.75179,0.738743,0.745209,0.820513
8,0.1855,0.812243,0.748463,0.742495,0.745467,0.822067
9,0.1957,0.806968,0.753671,0.746248,0.749941,0.824553
10,0.1591,0.806241,0.752302,0.747186,0.749735,0.824709


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 23. Training using 96 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4368,2.675462,0.279607,0.113508,0.161468,0.30303
2,1.5259,1.529711,0.568119,0.529081,0.547905,0.660451
3,0.9111,1.152169,0.640097,0.621482,0.630652,0.723232
4,0.5399,0.971368,0.705184,0.682692,0.693756,0.780109
5,0.39,0.910965,0.722556,0.705441,0.713896,0.794406
6,0.2911,0.896814,0.734099,0.719981,0.726971,0.805439
7,0.2353,0.881795,0.734945,0.727017,0.73096,0.81181
8,0.1696,0.863814,0.737312,0.735929,0.73662,0.81554
9,0.1459,0.875263,0.732878,0.7303,0.731587,0.812898
10,0.1554,0.875343,0.733584,0.731004,0.732292,0.812898


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 24. Training using 100 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4886,2.640605,0.302881,0.216932,0.252801,0.387723
2,1.556,1.494846,0.585992,0.529784,0.556472,0.671329
3,1.0508,1.150495,0.659829,0.633677,0.646489,0.732867
4,0.5995,0.947604,0.705516,0.689962,0.697652,0.778555
5,0.4509,0.855149,0.735763,0.715056,0.725262,0.804973
6,0.295,0.813863,0.740453,0.736632,0.738538,0.813364
7,0.1978,0.814009,0.744004,0.734756,0.739351,0.816162
8,0.1578,0.81871,0.739151,0.734991,0.737065,0.814452
9,0.1461,0.818424,0.742385,0.737336,0.739852,0.817094
10,0.1389,0.814881,0.745687,0.739916,0.74279,0.818493


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 25. Training using 104 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4535,2.618454,0.362261,0.235929,0.285755,0.416628
2,1.6006,1.465841,0.597436,0.546435,0.570799,0.676768
3,0.989,1.171604,0.651589,0.625,0.638018,0.733023
4,0.5867,0.973323,0.703908,0.688555,0.696147,0.778555
5,0.4073,0.897539,0.711761,0.708255,0.710004,0.795493
6,0.2894,0.872013,0.733254,0.721388,0.727273,0.805905
7,0.1939,0.87024,0.732861,0.727017,0.729927,0.807459
8,0.1607,0.874604,0.739192,0.729831,0.734482,0.8115
9,0.1446,0.866661,0.738061,0.732176,0.735107,0.812743
10,0.1387,0.865444,0.737898,0.73288,0.735381,0.813364


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 26. Training using 108 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4936,2.667525,0.30584,0.160882,0.21085,0.346853
2,1.7221,1.482293,0.580303,0.538931,0.558852,0.666822
3,0.8386,1.171951,0.636658,0.600375,0.617984,0.719192
4,0.6199,0.962743,0.702467,0.681051,0.691593,0.777001
5,0.4352,0.874283,0.718893,0.700516,0.709585,0.795027
6,0.2767,0.827658,0.735772,0.721623,0.728629,0.810101
7,0.2191,0.816575,0.749109,0.739447,0.744246,0.819114
8,0.1723,0.811464,0.751481,0.743902,0.747672,0.821134
9,0.1548,0.819024,0.751899,0.74273,0.747286,0.820513
10,0.1283,0.819562,0.751659,0.743902,0.74776,0.820668


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 27. Training using 112 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.6061,2.593147,0.309747,0.155019,0.206627,0.34561
2,1.6851,1.435271,0.587748,0.549015,0.567722,0.674903
3,0.7675,1.139319,0.6474,0.627814,0.637457,0.728361
4,0.5021,0.93698,0.691625,0.675891,0.683667,0.77296
5,0.402,0.832156,0.733763,0.720685,0.727165,0.806371
6,0.2703,0.824731,0.732147,0.723734,0.727916,0.810567
7,0.1827,0.801338,0.742857,0.737805,0.740322,0.816939
8,0.1432,0.793865,0.751243,0.744371,0.747791,0.822067
9,0.1378,0.797196,0.74841,0.745075,0.746739,0.821445
10,0.1144,0.800174,0.748879,0.744137,0.7465,0.82129


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 28. Training using 116 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4779,2.450448,0.393512,0.28166,0.328321,0.48547
2,1.4727,1.389966,0.584744,0.559099,0.571634,0.674126
3,0.782,1.060364,0.675584,0.651501,0.663324,0.745921
4,0.4974,0.866969,0.738222,0.712946,0.725364,0.801399
5,0.327,0.817091,0.754771,0.742026,0.748344,0.821445
6,0.2466,0.806766,0.747303,0.731004,0.739063,0.817716
7,0.1768,0.803713,0.74561,0.736867,0.741213,0.816939
8,0.1399,0.784586,0.754753,0.744841,0.749764,0.824242
9,0.1179,0.791519,0.756271,0.749531,0.752886,0.825796
10,0.1216,0.795402,0.754083,0.747186,0.750618,0.823932


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 29. Training using 120 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4888,2.45645,0.371079,0.277439,0.317499,0.467288
2,1.6556,1.405439,0.59995,0.557458,0.577924,0.687179
3,0.7901,1.094808,0.650556,0.631332,0.6408,0.736286
4,0.5092,0.951156,0.705455,0.682458,0.693766,0.778244
5,0.3095,0.815301,0.741541,0.724672,0.733009,0.813209
6,0.2372,0.81886,0.749227,0.738508,0.743829,0.820357
7,0.1557,0.815697,0.752143,0.740854,0.746456,0.823621
8,0.1462,0.811363,0.757939,0.755629,0.756782,0.830303
9,0.1309,0.814795,0.758084,0.753283,0.755676,0.829837
10,0.1063,0.814111,0.757669,0.753049,0.755352,0.828904


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▂▁▄▄▃▆▆▆▃▇▇▆▂▄▇█▇▂▇▇▇███▆████▇███▄██▇███
eval/f1,▁▁▃▄▃▅▅▅▂▆▇▆▁▃▇▇▇▁▇▇▆█▇▇▅███▇▆██▇▄██▇███
eval/loss,▇█▆▅▆▄▃▄▆▂▂▃▆▅▂▂▂▆▂▂▃▁▁▁▃▁▁▁▁▃▁▁▁▅▁▁▂▁▁▁
eval/precision,▂▁▃▄▃▅▆▅▃▇▇▆▁▄▇▇▇▂▇▇▆█▇▇▆███▇▆███▄██▇███
eval/recall,▁▁▃▃▂▅▅▅▂▆▇▆▁▃▇▇▇▁▇▇▆█▇▇▅███▇▆██▇▃██▇███
eval/runtime,▂▂▂▁▁▁▇▁▂▁▁▂▁▁██▂▁▂█▅▂▇▁▁▁▂▂▂▁▂█▂▁▂▂██▆▂
eval/samples_per_second,▆▇▇██▇▁█▇▇█▇██▁▁▇█▇▁▄▇▂▇█▇▇▇▇█▇▁▇▇▇▇▁▁▃▇
eval/steps_per_second,▆▇▇██▇▁█▇▇█▇██▁▁▇█▇▁▄▇▂▇█▇▇▇▇█▇▁▇▇▇▇▁▁▃▇
train/epoch,▆█▂▃▃▄▃▃▃▁█▇▆▄▃█▆▄▂█▅▃█▅▂▇▄▁▆▃▇▄█▅▂▆▂▇▃▇
train/global_step,▁▁▁▁▁▂▂▂▂▁▄▄▃▃▂▅▄▃▂▅▄▂▆▄▂▆▄▁▅▃▇▄█▅▂▆▃▇▃█

0,1
eval/accuracy,0.8289
eval/f1,0.75535
eval/loss,0.81411
eval/precision,0.75767
eval/recall,0.75305
eval/runtime,0.8939
eval/samples_per_second,86.143
eval/steps_per_second,22.375
train/epoch,10.0
train/global_step,300.0


Current seed:  184


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 0. Training using 4 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.832788,0.015657,0.019934,0.017538,0.02906
2,No log,3.591454,0.053993,0.062148,0.057785,0.133023
3,No log,3.386785,0.085479,0.075516,0.080189,0.19627
4,No log,3.230706,0.098967,0.069653,0.081762,0.197358
5,No log,3.125157,0.108688,0.068949,0.084374,0.199845
6,No log,3.056917,0.127382,0.089353,0.105031,0.227195
7,No log,3.012968,0.143162,0.109991,0.124403,0.261228
8,No log,2.987821,0.148874,0.119371,0.1325,0.278322
9,No log,2.976237,0.156071,0.127814,0.140536,0.28951
10,No log,2.97325,0.157431,0.129925,0.142362,0.292152


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 1. Training using 8 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.783311,0.020957,0.026501,0.023405,0.053147
2,No log,3.345499,0.100619,0.057223,0.072956,0.222222
3,No log,3.094484,0.150573,0.043152,0.06708,0.222067
4,No log,2.962506,0.198524,0.063086,0.095747,0.252214
5,No log,2.862295,0.241489,0.143058,0.179676,0.344678
6,No log,2.79231,0.264779,0.175422,0.211031,0.383838
7,No log,2.73756,0.279754,0.191839,0.227602,0.398291
8,2.719300,2.700532,0.288588,0.205206,0.239857,0.411655
9,2.719300,2.683302,0.292778,0.211069,0.245298,0.417094
10,2.719300,2.679536,0.292343,0.211304,0.245304,0.417716


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 2. Training using 12 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.55659,0.06421,0.069887,0.066929,0.142813
2,No log,3.076017,0.152044,0.065432,0.09149,0.21958
3,No log,2.889444,0.218137,0.104362,0.14118,0.282517
4,No log,2.747304,0.253904,0.175422,0.20749,0.373893
5,No log,2.612625,0.280095,0.22045,0.246719,0.42129
6,2.796000,2.492796,0.324779,0.26712,0.293141,0.461694
7,2.796000,2.40881,0.35304,0.295497,0.321716,0.485004
8,2.796000,2.35489,0.371421,0.310272,0.338104,0.497125
9,2.796000,2.332067,0.380017,0.317542,0.345982,0.503652
10,2.796000,2.327744,0.380432,0.318246,0.346571,0.50474


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 3. Training using 16 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.482643,0.069236,0.070356,0.069792,0.157731
2,No log,2.995827,0.196053,0.144465,0.166352,0.329448
3,No log,2.774736,0.233799,0.196295,0.213412,0.379798
4,2.946100,2.576461,0.30423,0.236163,0.26591,0.433722
5,2.946100,2.389553,0.371437,0.30863,0.337133,0.488423
6,2.946100,2.230763,0.411024,0.344512,0.374841,0.521523
7,2.946100,2.126149,0.431755,0.363508,0.394703,0.537995
8,1.632200,2.066986,0.439825,0.377111,0.406061,0.547786
9,1.632200,2.039654,0.445291,0.383677,0.412195,0.551826
10,1.632200,2.034545,0.445593,0.384146,0.412594,0.552603


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 4. Training using 20 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.425632,0.067071,0.056989,0.06162,0.154157
2,No log,2.892798,0.225985,0.153377,0.182733,0.299922
3,No log,2.596415,0.341989,0.290338,0.314054,0.47972
4,2.986300,2.301115,0.396966,0.337477,0.364812,0.527428
5,2.986300,2.048018,0.451492,0.393996,0.420789,0.560218
6,2.986300,1.837086,0.513831,0.461773,0.486413,0.609635
7,1.575100,1.735387,0.530858,0.486163,0.507528,0.623932
8,1.575100,1.685976,0.540253,0.500469,0.519601,0.630769
9,1.575100,1.661218,0.54474,0.503987,0.523572,0.635431
10,1.020200,1.656456,0.546792,0.505629,0.525405,0.636674


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 5. Training using 24 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.325291,0.112521,0.095685,0.103422,0.239161
2,No log,2.813636,0.234234,0.146341,0.180139,0.339239
3,3.132800,2.483487,0.348222,0.296201,0.320112,0.490754
4,3.132800,2.110438,0.43733,0.376407,0.404588,0.551204
5,3.132800,1.840136,0.509659,0.451689,0.478926,0.599223
6,1.683600,1.673706,0.55443,0.513602,0.533236,0.64087
7,1.683600,1.587319,0.581401,0.541041,0.560496,0.666511
8,1.009600,1.546965,0.592832,0.55863,0.575223,0.675991
9,1.009600,1.529974,0.598361,0.564962,0.581182,0.681119
10,1.009600,1.526485,0.59995,0.566604,0.582801,0.682517


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 6. Training using 28 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.197729,0.100622,0.08349,0.091259,0.211033
2,No log,2.737128,0.265876,0.236632,0.250403,0.411655
3,3.120700,2.336864,0.354311,0.299719,0.324736,0.494172
4,3.120700,1.927678,0.451271,0.378987,0.411982,0.562082
5,1.788600,1.700189,0.513203,0.460366,0.48535,0.617405
6,1.788600,1.554674,0.560162,0.5197,0.539173,0.660451
7,1.017600,1.498152,0.574956,0.540572,0.557234,0.668531
8,1.017600,1.441545,0.587637,0.555113,0.570912,0.683139
9,1.017600,1.424189,0.592859,0.560741,0.576353,0.686247
10,0.745700,1.421912,0.593409,0.561679,0.577108,0.687024


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 7. Training using 32 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.18162,0.060976,0.010553,0.017993,0.169386
2,3.213500,2.728549,0.248801,0.194653,0.218421,0.411033
3,3.213500,2.244971,0.366511,0.293621,0.326042,0.504118
4,1.881200,1.792426,0.492291,0.419325,0.452888,0.593162
5,1.881200,1.565832,0.568983,0.530019,0.54881,0.665734
6,1.032900,1.436612,0.60134,0.56848,0.584448,0.690754
7,1.032900,1.360545,0.611261,0.583021,0.596807,0.698057
8,0.700300,1.334718,0.616331,0.587711,0.601681,0.702253
9,0.700300,1.312554,0.61999,0.594981,0.607228,0.705828
10,0.605400,1.309408,0.622097,0.596857,0.609216,0.706915


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 8. Training using 36 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.078695,0.119826,0.097092,0.107268,0.241803
2,3.241100,2.609074,0.262471,0.212242,0.234699,0.416006
3,3.241100,2.116791,0.381833,0.319418,0.347848,0.515152
4,1.987100,1.697823,0.511652,0.458255,0.483484,0.627661
5,1.987100,1.485444,0.592304,0.570356,0.581123,0.684071
6,1.181300,1.385678,0.605302,0.583724,0.594317,0.694639
7,1.181300,1.302243,0.61823,0.599672,0.60881,0.709557
8,0.746200,1.263753,0.62729,0.610225,0.61864,0.719037
9,0.622600,1.252082,0.632403,0.616088,0.624139,0.721834
10,0.622600,1.251327,0.633277,0.616792,0.624926,0.722145


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 9. Training using 40 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.073492,0.175789,0.07833,0.108371,0.240715
2,3.288000,2.535536,0.238925,0.183396,0.20751,0.390521
3,3.288000,1.97178,0.435399,0.367495,0.398576,0.552914
4,2.038800,1.596055,0.558638,0.519465,0.53834,0.662626
5,1.213000,1.423622,0.596986,0.575985,0.586297,0.691064
6,1.213000,1.306853,0.619484,0.602486,0.610867,0.704895
7,0.819800,1.251425,0.632037,0.613508,0.622635,0.714685
8,0.601500,1.224958,0.640648,0.621717,0.63104,0.722611
9,0.601500,1.214802,0.640569,0.623593,0.631967,0.725874
10,0.557900,1.213356,0.640366,0.624296,0.632229,0.72603


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 10. Training using 44 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.013464,0.147382,0.103659,0.121713,0.268065
2,3.317900,2.416429,0.319523,0.276735,0.296594,0.480808
3,2.110000,1.78529,0.504982,0.439728,0.470102,0.614297
4,2.110000,1.446282,0.601564,0.559099,0.579555,0.685625
5,1.237100,1.295294,0.636275,0.612101,0.623954,0.715462
6,0.783200,1.181637,0.652764,0.631332,0.641869,0.738462
7,0.783200,1.122345,0.669971,0.649859,0.659762,0.752603
8,0.551700,1.102123,0.678356,0.657833,0.667937,0.758819
9,0.486400,1.091876,0.680183,0.660882,0.670394,0.760528
10,0.486400,1.091026,0.679537,0.660413,0.669838,0.760062


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 11. Training using 48 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.976455,0.163043,0.024625,0.042787,0.200777
2,3.395800,2.366533,0.325391,0.204972,0.251511,0.411344
3,2.157700,1.735896,0.497171,0.45333,0.474239,0.611189
4,1.301300,1.423716,0.593797,0.556754,0.574679,0.682828
5,1.301300,1.288954,0.615385,0.596623,0.605859,0.707537
6,0.817500,1.161665,0.657419,0.639071,0.648115,0.738462
7,0.584900,1.121048,0.66092,0.64728,0.654028,0.748563
8,0.488000,1.088216,0.675121,0.655488,0.665159,0.757887
9,0.488000,1.078879,0.676214,0.653377,0.664599,0.759441
10,0.424300,1.077771,0.676121,0.654081,0.664918,0.760062


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 12. Training using 52 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.9296,0.157276,0.090994,0.115287,0.271329
2,3.309200,2.210134,0.373674,0.305582,0.336215,0.518104
3,2.142200,1.608523,0.574566,0.527674,0.550122,0.667288
4,1.319200,1.337682,0.612169,0.580441,0.595883,0.694328
5,0.809000,1.186894,0.65778,0.636492,0.646961,0.738462
6,0.809000,1.146284,0.660667,0.645638,0.653066,0.74763
7,0.577700,1.099653,0.676577,0.656426,0.666349,0.755711
8,0.495800,1.077522,0.677373,0.657833,0.66746,0.758508
9,0.375900,1.06723,0.682601,0.659709,0.67096,0.763326
10,0.396800,1.065047,0.682856,0.659475,0.670962,0.76317


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 13. Training using 56 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.907212,0.123878,0.016182,0.028625,0.180264
2,3.409000,2.152097,0.382078,0.325985,0.35181,0.519192
3,2.217800,1.555734,0.569914,0.52955,0.548991,0.668376
4,1.383800,1.289559,0.63462,0.6053,0.619613,0.716861
5,0.912100,1.189761,0.649497,0.621013,0.634936,0.728982
6,0.583100,1.1212,0.658857,0.646341,0.652539,0.750272
7,0.474100,1.055508,0.687125,0.672139,0.679549,0.769075
8,0.404500,1.030977,0.691717,0.675657,0.683592,0.773271
9,0.404500,1.02488,0.698439,0.682223,0.690236,0.777467
10,0.362900,1.024726,0.699038,0.681989,0.690408,0.778244


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 14. Training using 60 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.932507,0.120091,0.074578,0.092014,0.232634
2,3.537500,2.00764,0.463486,0.407833,0.433882,0.584305
3,2.274300,1.436803,0.605637,0.559334,0.581565,0.690443
4,1.333200,1.203611,0.652333,0.626173,0.638985,0.740171
5,0.897300,1.049444,0.68627,0.662289,0.674066,0.763792
6,0.589200,1.006604,0.695965,0.679644,0.687708,0.77669
7,0.474000,0.978876,0.702056,0.680816,0.691273,0.78042
8,0.385400,0.962538,0.709654,0.687852,0.698583,0.785548
9,0.330000,0.94571,0.714148,0.694887,0.704386,0.789277
10,0.308300,0.943693,0.71618,0.696529,0.706218,0.789899


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 15. Training using 64 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3899,2.817911,0.26334,0.089118,0.13317,0.261538
2,2.2173,1.843974,0.489142,0.433161,0.459453,0.601709
3,1.2872,1.332776,0.614583,0.581144,0.597396,0.706294
4,0.8509,1.125655,0.669978,0.648452,0.659039,0.753069
5,0.6415,1.072726,0.67052,0.652908,0.661597,0.756643
6,0.4904,0.966217,0.706368,0.68152,0.693722,0.779176
7,0.4093,0.924789,0.707941,0.687852,0.697752,0.78446
8,0.3488,0.927665,0.715221,0.692073,0.703456,0.788967
9,0.3087,0.922622,0.716812,0.693949,0.705195,0.789588
10,0.2977,0.920381,0.718197,0.695122,0.706471,0.790987


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 16. Training using 68 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4675,2.885527,0.147251,0.074109,0.098596,0.250971
2,2.417,1.922693,0.431395,0.353189,0.388395,0.548873
3,1.4825,1.352693,0.608847,0.574578,0.591216,0.697436
4,0.9849,1.126901,0.672159,0.650563,0.661185,0.755556
5,0.6238,1.027949,0.680596,0.664634,0.67252,0.765967
6,0.5126,0.974798,0.699326,0.681285,0.690188,0.779021
7,0.3943,0.955173,0.709981,0.690666,0.70019,0.784771
8,0.3509,0.95774,0.71087,0.690197,0.700381,0.784305
9,0.3213,0.938708,0.716005,0.697702,0.706735,0.789122
10,0.2728,0.937281,0.716245,0.697936,0.706972,0.789588


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 17. Training using 72 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4414,2.763642,0.160612,0.118199,0.136179,0.305361
2,2.2606,1.65571,0.552687,0.492026,0.520596,0.645843
3,1.2815,1.28104,0.635306,0.601782,0.61809,0.716706
4,0.915,1.117153,0.675987,0.646341,0.660832,0.749806
5,0.6669,1.018355,0.688964,0.66909,0.678882,0.769852
6,0.5254,0.959727,0.704799,0.681989,0.693206,0.783683
7,0.4144,0.954591,0.704551,0.68621,0.69526,0.785703
8,0.2877,0.928893,0.715736,0.694418,0.704916,0.793784
9,0.2523,0.930208,0.717681,0.693949,0.705616,0.794716
10,0.2501,0.930599,0.717955,0.694887,0.706233,0.794872


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 18. Training using 76 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.487,2.803045,0.234856,0.110929,0.150685,0.30676
2,2.3759,1.717407,0.512004,0.445122,0.476226,0.620047
3,1.46,1.258059,0.63043,0.609287,0.619678,0.720591
4,1.0076,1.029511,0.691241,0.666276,0.678529,0.769231
5,0.6969,0.95586,0.705495,0.677533,0.691231,0.781197
6,0.3852,0.914921,0.710616,0.681285,0.695642,0.7885
7,0.3223,0.898832,0.712458,0.692073,0.702118,0.791919
8,0.2656,0.881039,0.726568,0.703565,0.714881,0.799689
9,0.2372,0.87599,0.725163,0.703565,0.714201,0.799223
10,0.237,0.876212,0.726525,0.704034,0.715102,0.799689


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 19. Training using 80 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4092,2.640482,0.22381,0.121248,0.157286,0.324165
2,2.2369,1.527068,0.591858,0.531895,0.560277,0.670862
3,1.357,1.173587,0.64955,0.625938,0.637525,0.731158
4,0.6597,1.029905,0.689045,0.666745,0.677712,0.765346
5,0.4735,0.926043,0.719247,0.689728,0.704178,0.789277
6,0.4119,0.881142,0.734559,0.702861,0.71836,0.801088
7,0.3116,0.882816,0.73293,0.709897,0.721229,0.801865
8,0.2494,0.879647,0.732459,0.707552,0.71979,0.801399
9,0.2117,0.866083,0.737125,0.708255,0.722402,0.805905
10,0.2237,0.869636,0.736084,0.707083,0.721292,0.804507


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 20. Training using 84 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.476,2.694339,0.256663,0.182927,0.213611,0.379643
2,2.4225,1.576301,0.559548,0.511257,0.534314,0.656721
3,1.5315,1.181124,0.642664,0.613274,0.627625,0.72805
4,0.7241,1.004385,0.694714,0.671904,0.683119,0.77094
5,0.5302,0.961015,0.706577,0.687852,0.697089,0.787102
6,0.4541,0.898892,0.725434,0.706379,0.715779,0.79798
7,0.2937,0.884382,0.727449,0.705441,0.716276,0.801399
8,0.247,0.876242,0.725971,0.701454,0.713502,0.798601
9,0.2221,0.871421,0.72703,0.70333,0.714984,0.799223
10,0.2181,0.870676,0.727251,0.702861,0.714848,0.799845


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 21. Training using 88 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4374,2.592428,0.298049,0.143293,0.193538,0.346853
2,2.359,1.490521,0.58816,0.540572,0.563363,0.673504
3,0.9653,1.174443,0.640471,0.625,0.632641,0.728361
4,0.7082,1.024436,0.685632,0.666979,0.676177,0.768454
5,0.5203,0.932025,0.72694,0.69864,0.712509,0.792075
6,0.3589,0.923077,0.726568,0.703565,0.714881,0.795183
7,0.3068,0.884918,0.742528,0.710835,0.726336,0.804507
8,0.2138,0.874859,0.737186,0.715056,0.725952,0.804196
9,0.2054,0.877545,0.742697,0.715525,0.728858,0.805905
10,0.1869,0.878271,0.742934,0.715056,0.728728,0.805128


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 22. Training using 92 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4595,2.645446,0.244473,0.17894,0.206635,0.372339
2,2.497,1.528665,0.563927,0.521341,0.541799,0.657964
3,1.0653,1.179667,0.632123,0.616557,0.624243,0.725253
4,0.8154,0.97626,0.707449,0.672608,0.689589,0.780886
5,0.457,0.925643,0.723952,0.692542,0.707899,0.790365
6,0.3842,0.860361,0.736029,0.704268,0.719799,0.804817
7,0.2832,0.846698,0.733965,0.70849,0.721002,0.805439
8,0.2183,0.850509,0.738667,0.714587,0.726427,0.808702
9,0.2091,0.854742,0.735173,0.712242,0.723526,0.806527
10,0.1841,0.853652,0.737339,0.713649,0.725301,0.807304


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 23. Training using 96 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.6231,2.643192,0.315362,0.12758,0.181666,0.3108
2,1.5325,1.523249,0.570998,0.533771,0.551758,0.65843
3,1.0014,1.145366,0.652982,0.634146,0.643427,0.738151
4,0.5776,0.953889,0.709537,0.685741,0.697436,0.783061
5,0.4502,0.899868,0.726417,0.706144,0.716137,0.794561
6,0.2856,0.874945,0.731766,0.708255,0.719819,0.801554
7,0.2413,0.85929,0.736791,0.716229,0.726365,0.804507
8,0.1952,0.862609,0.741974,0.720919,0.731295,0.808236
9,0.1719,0.857811,0.740785,0.721154,0.730838,0.809013
10,0.1662,0.856334,0.7415,0.721154,0.731185,0.809324


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 24. Training using 100 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4618,2.600487,0.283483,0.229831,0.253853,0.446931
2,1.54,1.49261,0.577857,0.530019,0.552905,0.668376
3,1.0466,1.080865,0.67832,0.655253,0.666587,0.760218
4,0.5284,0.958173,0.710271,0.687617,0.698761,0.784615
5,0.4406,0.91026,0.728743,0.697467,0.712762,0.794716
6,0.3056,0.874575,0.735151,0.708255,0.721452,0.801709
7,0.2706,0.877464,0.728108,0.70591,0.716837,0.796892
8,0.1688,0.841694,0.736077,0.712946,0.724327,0.807304
9,0.1659,0.845052,0.735422,0.71576,0.725458,0.807304
10,0.1762,0.846119,0.736651,0.715056,0.725693,0.807148


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 25. Training using 104 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5555,2.593493,0.270349,0.130863,0.176359,0.339239
2,1.7339,1.460141,0.583291,0.540338,0.560993,0.668998
3,1.1041,1.103686,0.668429,0.652439,0.660337,0.751671
4,0.6177,0.953584,0.718399,0.690432,0.704138,0.791298
5,0.4459,0.867162,0.728748,0.705675,0.717026,0.799845
6,0.3179,0.843234,0.747143,0.720685,0.733676,0.812587
7,0.2239,0.83913,0.745601,0.715525,0.730254,0.808081
8,0.1908,0.82885,0.74387,0.718574,0.731003,0.808702
9,0.1817,0.822291,0.752497,0.724437,0.738201,0.813986
10,0.1775,0.821905,0.752191,0.724672,0.738175,0.813831


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 26. Training using 108 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5247,2.496444,0.325884,0.229128,0.269072,0.4331
2,1.6121,1.342865,0.614688,0.573171,0.593204,0.694328
3,0.8108,1.058528,0.666747,0.648452,0.657472,0.755556
4,0.6054,0.907673,0.717583,0.685272,0.701056,0.786014
5,0.4315,0.8886,0.722892,0.703565,0.713097,0.790676
6,0.2847,0.808816,0.743237,0.721623,0.73227,0.81352
7,0.2262,0.813492,0.742768,0.722561,0.732525,0.812121
8,0.1985,0.798842,0.742333,0.720919,0.731469,0.81352
9,0.1628,0.805956,0.743221,0.726313,0.73467,0.815229
10,0.1542,0.807046,0.744354,0.726548,0.735343,0.81554


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 27. Training using 112 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5379,2.462192,0.346074,0.195356,0.249738,0.417716
2,1.5744,1.342499,0.611834,0.562617,0.586194,0.690287
3,0.8138,0.997099,0.701239,0.677064,0.688939,0.769852
4,0.5496,0.907061,0.717507,0.693949,0.705532,0.790365
5,0.3809,0.85631,0.730439,0.718105,0.724219,0.802331
6,0.2684,0.821511,0.748672,0.727251,0.737806,0.817094
7,0.2103,0.799399,0.74501,0.735225,0.740085,0.817405
8,0.1845,0.798271,0.750301,0.730769,0.740406,0.818493
9,0.1583,0.79009,0.755304,0.734756,0.744888,0.822378
10,0.1459,0.790511,0.755304,0.734756,0.744888,0.821756


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 28. Training using 116 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5704,2.417984,0.306739,0.238039,0.268058,0.440093
2,1.5964,1.349056,0.616038,0.57833,0.596589,0.696193
3,0.9072,1.015517,0.679406,0.675422,0.677408,0.763792
4,0.5376,0.917496,0.714526,0.696764,0.705533,0.788967
5,0.3808,0.863014,0.734552,0.716463,0.725395,0.804973
6,0.291,0.813201,0.7449,0.727955,0.73633,0.815695
7,0.2166,0.821999,0.742273,0.732176,0.73719,0.815851
8,0.1719,0.823244,0.749342,0.734756,0.741978,0.816472
9,0.1456,0.822802,0.749761,0.736398,0.743019,0.817716
10,0.1506,0.824663,0.749761,0.737101,0.743377,0.818026


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 29. Training using 120 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4866,2.441573,0.307179,0.21576,0.253478,0.418182
2,1.6537,1.341518,0.614161,0.579737,0.596453,0.69728
3,0.8541,1.06963,0.666177,0.637899,0.651731,0.753535
4,0.5773,0.883897,0.725323,0.697936,0.711366,0.797514
5,0.3578,0.855327,0.730704,0.708255,0.719305,0.805439
6,0.2502,0.814852,0.740106,0.719278,0.729543,0.813986
7,0.1913,0.811845,0.743528,0.727486,0.73542,0.818182
8,0.1714,0.797557,0.754087,0.735694,0.744777,0.824864
9,0.1291,0.802106,0.752221,0.734756,0.743386,0.824709
10,0.1389,0.803426,0.753003,0.734991,0.743888,0.824864


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▂▁▄▅▄▆▆▆▄▇▇▆▃▅▇▇▇▂██▇███▆████▆███▄██████
eval/f1,▂▁▃▄▃▅▆▅▃▆▇▅▂▄▇▇▇▁▇▇▇██▇▅████▆███▂██▇███
eval/loss,▇█▅▅▆▄▃▃▆▂▂▃▆▅▂▂▂▆▂▂▂▁▁▂▃▁▁▁▁▃▁▁▁▅▁▁▁▁▁▁
eval/precision,▂▁▄▄▃▅▆▆▃▆▇▆▂▄▇▇▇▂▇▇▇██▇▆████▆███▃██▇███
eval/recall,▂▁▃▃▃▅▆▅▃▆▇▅▂▄▇▇▆▁▇▇▇██▇▅████▆███▂██▇███
eval/runtime,▁▁▇▂▃█▂▂▁▁▁▂▆▂▇▃▁▁▁▆▁▁▄▁▆▁▁▁▂▂▁▂▁▁▁▁▁▁▁▂
eval/samples_per_second,█▇▂▇▅▁▇▇█▇▇▆▂▇▂▅██▇▂█▇▅█▃███▇▇█▇███████▇
eval/steps_per_second,█▇▂▇▅▁▇▇█▇▇▆▂▇▂▅██▇▂█▇▅█▃███▇▇█▇███████▇
train/epoch,▆█▂▃▃▄▃▃▃▁█▇▆▄▃█▆▄▂█▅▃█▅▂▇▄▁▆▃▇▄█▅▂▆▂▇▃▇
train/global_step,▁▁▁▁▁▂▂▂▂▁▄▄▃▃▂▅▄▃▂▅▄▂▆▄▂▆▄▁▅▃▇▄█▅▂▆▃▇▃█

0,1
eval/accuracy,0.82486
eval/f1,0.74389
eval/loss,0.80343
eval/precision,0.753
eval/recall,0.73499
eval/runtime,1.0421
eval/samples_per_second,73.891
eval/steps_per_second,19.192
train/epoch,10.0
train/global_step,300.0


Current seed:  1255


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 0. Training using 4 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.890504,0.007775,0.009615,0.008598,0.013831
2,No log,3.611541,0.066031,0.081144,0.072811,0.128671
3,No log,3.383992,0.106147,0.065197,0.080779,0.215851
4,No log,3.214814,0.109375,0.02955,0.046529,0.198291
5,No log,3.102307,0.111389,0.020872,0.035157,0.191142
6,No log,3.033006,0.130102,0.023921,0.040412,0.195493
7,No log,2.990445,0.153576,0.030722,0.051202,0.204507
8,No log,2.966095,0.166488,0.036351,0.059673,0.21181
9,No log,2.954934,0.179104,0.042214,0.068324,0.218959
10,No log,2.952078,0.182796,0.043856,0.07074,0.219891


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 1. Training using 8 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.711834,0.024977,0.03166,0.027924,0.050971
2,No log,3.285401,0.086871,0.041276,0.055962,0.195804
3,No log,3.028898,0.198643,0.048077,0.077417,0.209324
4,No log,2.882263,0.272668,0.098734,0.144972,0.269775
5,No log,2.777674,0.29298,0.163462,0.209845,0.340637
6,No log,2.690884,0.298915,0.200281,0.239854,0.384305
7,No log,2.623006,0.306431,0.227955,0.261431,0.415695
8,2.685200,2.580619,0.316219,0.245544,0.276436,0.439161
9,2.685200,2.56268,0.320383,0.251407,0.281735,0.446931
10,2.685200,2.558905,0.324486,0.255159,0.285677,0.449573


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 2. Training using 12 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.594126,0.046729,0.051595,0.049041,0.099301
2,No log,3.040004,0.066901,0.004456,0.008355,0.166589
3,No log,2.838502,0.173913,0.018762,0.03387,0.190521
4,No log,2.658473,0.322642,0.160413,0.214286,0.356022
5,No log,2.499819,0.342207,0.229128,0.274477,0.434188
6,2.827700,2.367714,0.348881,0.263133,0.3,0.475369
7,2.827700,2.283076,0.366123,0.295028,0.326753,0.50272
8,2.827700,2.234096,0.386248,0.320122,0.35009,0.519037
9,2.827700,2.212231,0.395487,0.328799,0.359073,0.524786
10,2.827700,2.208092,0.397512,0.329737,0.360467,0.525563


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 3. Training using 16 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.480757,0.078861,0.067542,0.072764,0.189433
2,No log,2.983545,0.122596,0.011961,0.021795,0.181507
3,No log,2.706442,0.316267,0.114447,0.168073,0.297902
4,2.911300,2.466759,0.314334,0.215994,0.256047,0.422533
5,2.911300,2.270029,0.349708,0.238743,0.283763,0.447397
6,2.911300,2.122669,0.386547,0.303236,0.339861,0.504895
7,2.911300,2.021376,0.432085,0.370779,0.399091,0.5554
8,1.606600,1.966556,0.452866,0.396576,0.422856,0.572339
9,1.606600,1.943427,0.46115,0.406426,0.432062,0.578399
10,1.606600,1.939297,0.462214,0.407364,0.433059,0.579176


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 4. Training using 20 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.34078,0.114592,0.092636,0.102451,0.247397
2,No log,2.815407,0.244358,0.07364,0.113174,0.253924
3,No log,2.506672,0.307229,0.179409,0.226532,0.378555
4,2.974100,2.179271,0.400055,0.341698,0.368581,0.523232
5,2.974100,1.931286,0.46162,0.409006,0.433723,0.584149
6,2.974100,1.769008,0.5143,0.472326,0.492421,0.62533
7,1.585000,1.679762,0.53357,0.493902,0.51297,0.637296
8,1.585000,1.627252,0.540268,0.501876,0.520365,0.641958
9,1.585000,1.603133,0.54447,0.506801,0.524961,0.645998
10,1.073100,1.599373,0.546737,0.508912,0.527147,0.646775


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 5. Training using 24 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.301039,0.088067,0.046904,0.061209,0.200932
2,No log,2.796629,0.180918,0.094278,0.123959,0.275369
3,3.084800,2.410532,0.357356,0.281426,0.314878,0.4662
4,3.084800,2.053469,0.428386,0.386492,0.406362,0.556643
5,3.084800,1.768976,0.52207,0.482645,0.501584,0.631391
6,1.700400,1.615309,0.563737,0.527908,0.545234,0.662005
7,1.700400,1.526024,0.577927,0.545263,0.56112,0.671018
8,0.988700,1.482028,0.588556,0.557223,0.572461,0.677855
9,0.988700,1.463708,0.59375,0.561445,0.577146,0.68174
10,0.988700,1.460451,0.594648,0.562852,0.578313,0.682207


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 6. Training using 28 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.152936,0.059501,0.00727,0.012957,0.169231
2,No log,2.751521,0.289897,0.118433,0.168165,0.306915
3,3.096700,2.385567,0.31054,0.141651,0.194556,0.339239
4,3.096700,2.030738,0.432358,0.367261,0.39716,0.539394
5,1.875400,1.73629,0.518069,0.470685,0.493242,0.62331
6,1.875400,1.55137,0.558536,0.522514,0.539925,0.660917
7,1.085800,1.455211,0.575162,0.541979,0.558078,0.671018
8,1.085800,1.407201,0.589484,0.560038,0.574384,0.682207
9,1.085800,1.387462,0.593666,0.567073,0.580065,0.68749
10,0.797100,1.384427,0.595191,0.568949,0.581775,0.688733


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 7. Training using 32 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.155952,0.047319,0.003518,0.006549,0.158664
2,3.116600,2.571421,0.320348,0.215994,0.258019,0.410567
3,3.116600,2.010682,0.465435,0.413696,0.438043,0.577001
4,1.677400,1.653551,0.552712,0.511492,0.531303,0.653613
5,1.677400,1.493588,0.58784,0.553236,0.570013,0.675058
6,0.931500,1.395696,0.612235,0.589118,0.600454,0.699611
7,0.931500,1.330963,0.619845,0.599203,0.609349,0.705828
8,0.643500,1.312438,0.623871,0.599437,0.61141,0.709868
9,0.643500,1.301864,0.625977,0.601313,0.613397,0.711267
10,0.560800,1.299983,0.625852,0.602955,0.61419,0.711888


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 8. Training using 36 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.085852,0.0,0.0,0.0,0.154934
2,3.201000,2.558927,0.31332,0.184803,0.232483,0.376535
3,3.201000,2.012038,0.427446,0.368902,0.396022,0.540482
4,1.926500,1.644692,0.540623,0.500938,0.520024,0.647863
5,1.926500,1.471284,0.566857,0.535882,0.550934,0.669153
6,1.107700,1.311864,0.611017,0.590525,0.600596,0.700389
7,1.107700,1.248053,0.626676,0.613743,0.620142,0.714996
8,0.682600,1.2114,0.633557,0.620779,0.627103,0.721057
9,0.570800,1.205282,0.633478,0.61773,0.625505,0.721834
10,0.570800,1.203515,0.635597,0.618902,0.627139,0.722922


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 9. Training using 40 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.029108,0.067961,0.001642,0.003206,0.156643
2,3.182700,2.316164,0.37746,0.24742,0.298909,0.436053
3,3.182700,1.732645,0.529851,0.48288,0.505276,0.631702
4,1.807500,1.4596,0.592352,0.555816,0.573503,0.680808
5,0.957700,1.408786,0.607641,0.581848,0.594465,0.696348
6,0.957700,1.250095,0.646647,0.628752,0.637574,0.721678
7,0.654000,1.205434,0.655718,0.641417,0.648488,0.73784
8,0.530200,1.16356,0.663799,0.651501,0.657593,0.74934
9,0.530200,1.169658,0.668029,0.651735,0.659782,0.749495
10,0.469400,1.169618,0.66843,0.65197,0.660097,0.749495


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 10. Training using 44 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.008834,0.075,0.002111,0.004106,0.15913
2,3.234500,2.248719,0.400479,0.274625,0.325821,0.457964
3,1.891800,1.621031,0.569711,0.52228,0.544965,0.658897
4,1.891800,1.372024,0.607178,0.575281,0.5908,0.690287
5,1.041300,1.204189,0.645757,0.622889,0.634117,0.726651
6,0.655900,1.156021,0.658206,0.626407,0.641913,0.732246
7,0.655900,1.092161,0.671602,0.648921,0.660067,0.749806
8,0.496200,1.075255,0.678405,0.650563,0.664193,0.754623
9,0.445000,1.067538,0.68233,0.653846,0.667784,0.75742
10,0.445000,1.065308,0.683619,0.655722,0.66938,0.758508


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 11. Training using 48 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,3.037884,0.011494,0.000235,0.00046,0.1554
2,3.301600,2.357925,0.354496,0.257974,0.298629,0.448951
3,2.133700,1.661067,0.545524,0.498827,0.521132,0.647708
4,1.174600,1.376064,0.622032,0.595919,0.608696,0.705828
5,1.174600,1.218921,0.649439,0.624765,0.636863,0.727894
6,0.737000,1.160238,0.66765,0.636961,0.651944,0.74359
7,0.501400,1.126531,0.672665,0.648687,0.660458,0.750894
8,0.448900,1.100344,0.686486,0.655253,0.670506,0.760373
9,0.448900,1.09961,0.684647,0.657833,0.670972,0.760684
10,0.373100,1.09911,0.68584,0.659944,0.672643,0.761461


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 12. Training using 52 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.95975,0.024691,0.000938,0.001808,0.160373
2,3.338600,2.146369,0.341479,0.252345,0.290223,0.449417
3,1.999200,1.531788,0.574371,0.529784,0.551177,0.66418
4,1.218300,1.281159,0.625398,0.599437,0.612142,0.706605
5,0.692400,1.174586,0.653288,0.633677,0.643333,0.737685
6,0.692400,1.092465,0.684378,0.655488,0.669621,0.758197
7,0.524200,1.0457,0.69764,0.672608,0.684896,0.771251
8,0.415700,1.036745,0.696662,0.675422,0.685878,0.771562
9,0.350900,1.03583,0.701428,0.679878,0.690485,0.773116
10,0.322500,1.034827,0.701716,0.680816,0.691108,0.773582


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 13. Training using 56 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.964847,0.209596,0.077861,0.113543,0.242269
2,3.379700,2.064214,0.459887,0.40197,0.428983,0.573582
3,2.167600,1.48228,0.587137,0.545966,0.565804,0.677389
4,1.201100,1.253339,0.635175,0.603893,0.619139,0.715152
5,0.738300,1.100359,0.669924,0.643058,0.656216,0.749806
6,0.532300,1.037765,0.702696,0.672373,0.6872,0.772339
7,0.439700,1.011044,0.701827,0.675657,0.688493,0.77467
8,0.339800,0.992522,0.708858,0.686914,0.697713,0.78073
9,0.339800,0.990632,0.710138,0.688321,0.699059,0.78073
10,0.308900,0.990917,0.709615,0.687148,0.698201,0.779798


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 14. Training using 60 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,No log,2.887024,0.254197,0.024859,0.045289,0.182906
2,3.330100,1.986162,0.434133,0.394934,0.413607,0.5554
3,2.127800,1.452632,0.57221,0.539869,0.555569,0.670552
4,1.264000,1.199291,0.637566,0.621717,0.629542,0.7223
5,0.777700,1.081299,0.682316,0.657833,0.669851,0.753535
6,0.554200,1.044042,0.695961,0.666745,0.68104,0.763326
7,0.426300,1.001472,0.707928,0.682692,0.695081,0.777467
8,0.334000,1.000527,0.710367,0.68621,0.698079,0.783061
9,0.304000,0.995347,0.708888,0.686445,0.697486,0.783528
10,0.271900,0.995911,0.708576,0.685976,0.697092,0.783217


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 15. Training using 64 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4064,2.930979,0.044248,0.001173,0.002285,0.15742
2,2.2727,1.936421,0.443869,0.382036,0.410638,0.559907
3,1.3496,1.438804,0.588892,0.556989,0.572496,0.679254
4,0.8626,1.191978,0.633277,0.616792,0.624926,0.718881
5,0.5914,1.069407,0.687071,0.658068,0.672257,0.766278
6,0.4412,1.004524,0.702893,0.678002,0.690223,0.778866
7,0.3575,0.985834,0.702097,0.683161,0.6925,0.781507
8,0.2978,0.976499,0.708031,0.686445,0.697071,0.783838
9,0.2654,0.977689,0.707388,0.687148,0.697121,0.783372
10,0.2588,0.977864,0.706422,0.68621,0.696169,0.782906


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 16. Training using 68 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4029,2.795246,0.24126,0.114916,0.155679,0.309091
2,2.167,1.765044,0.52974,0.467871,0.496887,0.62906
3,1.2036,1.317952,0.633034,0.595919,0.613916,0.709246
4,0.8064,1.126906,0.668312,0.635084,0.651275,0.740482
5,0.5399,1.029463,0.698141,0.669325,0.683429,0.770008
6,0.4312,0.990564,0.715162,0.68363,0.699041,0.779332
7,0.3306,0.958129,0.723201,0.693011,0.707784,0.789899
8,0.3001,0.946378,0.724347,0.701923,0.712959,0.790987
9,0.2375,0.939641,0.726899,0.704737,0.715647,0.793007
10,0.2353,0.940306,0.726525,0.704034,0.715102,0.792852


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 17. Training using 72 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4679,2.820933,0.1404,0.070826,0.094154,0.2777
2,2.2471,1.727163,0.516417,0.461069,0.487176,0.620513
3,1.2735,1.316873,0.626155,0.604128,0.614944,0.703186
4,0.8729,1.12815,0.666345,0.64728,0.656674,0.738772
5,0.6173,1.012435,0.697804,0.678002,0.68776,0.766589
6,0.4649,0.980472,0.699306,0.685038,0.692098,0.77265
7,0.3917,0.932165,0.721276,0.705206,0.713151,0.795493
8,0.2687,0.934791,0.727317,0.706848,0.716936,0.79596
9,0.2463,0.925545,0.728389,0.709428,0.718783,0.797047
10,0.2247,0.924822,0.727338,0.709428,0.718271,0.797047


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 18. Training using 76 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.3945,2.7963,0.175688,0.046435,0.073456,0.232012
2,2.286,1.753194,0.51433,0.471388,0.491924,0.625019
3,1.4123,1.350224,0.603905,0.587477,0.595578,0.694949
4,0.9541,1.170387,0.649248,0.61773,0.633097,0.72805
5,0.6715,1.031668,0.698331,0.667214,0.682418,0.768298
6,0.3695,1.012261,0.697471,0.672608,0.684814,0.77467
7,0.3218,0.986155,0.707429,0.687852,0.697503,0.783838
8,0.2853,0.955261,0.712843,0.695122,0.703871,0.789122
9,0.2676,0.955914,0.714148,0.694887,0.704386,0.789433
10,0.2271,0.956959,0.71432,0.694887,0.70447,0.789588


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 19. Training using 80 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4742,2.758225,0.245063,0.064024,0.101525,0.26791
2,2.2931,1.648192,0.556091,0.513837,0.53413,0.650194
3,1.4279,1.261541,0.639421,0.610929,0.62485,0.713442
4,0.7162,1.091752,0.679538,0.647983,0.663385,0.753691
5,0.5357,1.005529,0.71273,0.690666,0.701525,0.781507
6,0.4311,0.929024,0.727338,0.709428,0.718271,0.797358
7,0.3205,0.916,0.73343,0.713649,0.723404,0.803574
8,0.2494,0.917718,0.735146,0.716698,0.725805,0.803108
9,0.2365,0.91883,0.736425,0.718809,0.72751,0.803885
10,0.2202,0.917434,0.737146,0.719512,0.728222,0.804507


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 20. Training using 84 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4043,2.707532,0.279135,0.208959,0.239002,0.399845
2,2.3774,1.638175,0.550865,0.507974,0.528551,0.649883
3,1.4374,1.246577,0.625855,0.60061,0.612973,0.709091
4,0.6709,1.061293,0.685136,0.666979,0.675936,0.767832
5,0.5214,0.97368,0.710305,0.69348,0.701792,0.787723
6,0.4586,0.928457,0.709151,0.70333,0.706229,0.790831
7,0.281,0.919207,0.718467,0.708021,0.713206,0.796892
8,0.2452,0.904756,0.725998,0.716463,0.721199,0.800932
9,0.2332,0.903826,0.727122,0.721154,0.724126,0.802176
10,0.1997,0.902565,0.728305,0.722326,0.725303,0.803419


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 21. Training using 88 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4779,2.665235,0.296335,0.199109,0.238182,0.393318
2,2.3392,1.574625,0.562276,0.51454,0.53735,0.65439
3,1.0171,1.259409,0.631289,0.617964,0.624556,0.716239
4,0.703,1.082122,0.677789,0.652674,0.664994,0.760839
5,0.5383,0.987884,0.705501,0.68879,0.697045,0.781818
6,0.3546,0.923713,0.725126,0.70591,0.715389,0.794872
7,0.2828,0.91525,0.725857,0.710366,0.718028,0.799689
8,0.2299,0.906441,0.736061,0.721388,0.728651,0.804973
9,0.2101,0.900844,0.732904,0.721388,0.727101,0.805594
10,0.1875,0.900031,0.733302,0.720919,0.727058,0.80575


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 22. Training using 92 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4685,2.735184,0.250996,0.044325,0.075344,0.229215
2,2.4445,1.573264,0.566176,0.523687,0.544103,0.656099
3,1.0064,1.185824,0.65959,0.626642,0.642694,0.729915
4,0.7108,1.025452,0.704755,0.681285,0.692821,0.777312
5,0.4658,0.94443,0.724421,0.704034,0.714082,0.790676
6,0.338,0.91023,0.729581,0.714353,0.721886,0.797514
7,0.2544,0.879064,0.734035,0.719747,0.726821,0.80202
8,0.218,0.878215,0.737443,0.726548,0.731955,0.807148
9,0.1926,0.879252,0.739182,0.729128,0.73412,0.808392
10,0.1757,0.880023,0.739658,0.729597,0.734593,0.808547


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 23. Training using 96 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5085,2.649284,0.319876,0.193246,0.240936,0.386014
2,1.5608,1.47198,0.584247,0.537523,0.559912,0.672572
3,0.9484,1.098406,0.689209,0.650094,0.66908,0.756954
4,0.602,0.977776,0.700989,0.681754,0.691238,0.778089
5,0.4413,0.899506,0.733898,0.710835,0.722183,0.802486
6,0.2899,0.871071,0.735808,0.72045,0.728048,0.80373
7,0.2523,0.850217,0.737873,0.724203,0.730974,0.808392
8,0.1973,0.84098,0.737066,0.731707,0.734377,0.810567
9,0.1716,0.842513,0.735719,0.727955,0.731817,0.80979
10,0.161,0.842066,0.736605,0.728659,0.73261,0.809946


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 24. Training using 100 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5105,2.623509,0.257702,0.188321,0.217615,0.389744
2,1.6119,1.528684,0.567882,0.525797,0.54603,0.661383
3,1.0578,1.171685,0.644558,0.622186,0.633174,0.732246
4,0.6315,1.031211,0.682945,0.65924,0.670883,0.762082
5,0.4954,0.896923,0.726719,0.699109,0.712646,0.796115
6,0.2975,0.899448,0.722892,0.703565,0.713097,0.795183
7,0.2682,0.877503,0.735506,0.719981,0.727661,0.803263
8,0.2046,0.886473,0.735763,0.715056,0.725262,0.80373
9,0.172,0.878486,0.738942,0.720919,0.72982,0.806216
10,0.1581,0.877329,0.740331,0.722795,0.731458,0.807304


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 25. Training using 104 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.5748,2.59042,0.28125,0.156191,0.200844,0.354157
2,1.5936,1.45447,0.59386,0.553471,0.572955,0.684693
3,1.0007,1.117322,0.657443,0.646341,0.651845,0.747475
4,0.5862,0.998985,0.704479,0.678705,0.691352,0.778089
5,0.444,0.906591,0.727536,0.708255,0.717766,0.798912
6,0.326,0.887841,0.72795,0.710366,0.71905,0.801088
7,0.2366,0.87021,0.737783,0.725844,0.731765,0.809324
8,0.1734,0.875556,0.735113,0.729597,0.732345,0.812121
9,0.1794,0.875378,0.740266,0.731238,0.735724,0.813054
10,0.1682,0.875519,0.741874,0.733349,0.737587,0.813986


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 26. Training using 108 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.6016,2.464699,0.35836,0.266417,0.305623,0.449417
2,1.4697,1.377771,0.617068,0.588415,0.602401,0.699456
3,0.7519,1.064035,0.683661,0.660413,0.671836,0.76115
4,0.5459,0.938479,0.720175,0.696529,0.708155,0.788034
5,0.3895,0.878808,0.726922,0.707317,0.716986,0.798912
6,0.2784,0.8378,0.732775,0.71834,0.725486,0.803885
7,0.2179,0.81475,0.742212,0.731942,0.737041,0.816628
8,0.1753,0.847712,0.742525,0.733818,0.738146,0.81554
9,0.1403,0.848027,0.742823,0.734287,0.73853,0.816162
10,0.1497,0.8477,0.743833,0.73546,0.739623,0.816783


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 27. Training using 112 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4676,2.453459,0.357407,0.226313,0.27714,0.418026
2,1.5937,1.364569,0.622306,0.582317,0.601648,0.701476
3,0.7929,1.061017,0.690824,0.655019,0.672445,0.753069
4,0.5147,0.931911,0.719961,0.696998,0.708294,0.788811
5,0.3817,0.818365,0.738406,0.716932,0.727511,0.808547
6,0.2761,0.814072,0.747263,0.736398,0.741791,0.815851
7,0.2234,0.836934,0.746028,0.737805,0.741894,0.816472
8,0.1823,0.828191,0.745956,0.73546,0.740671,0.818803
9,0.1555,0.836819,0.744711,0.734756,0.7397,0.816939
10,0.1365,0.836218,0.74306,0.734522,0.738766,0.816939


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 28. Training using 116 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4721,2.437177,0.297731,0.200047,0.239304,0.400777
2,1.6044,1.399691,0.606577,0.583959,0.595053,0.698368
3,0.7892,1.0983,0.665701,0.646811,0.65612,0.747786
4,0.5476,0.957291,0.704246,0.688555,0.696312,0.780575
5,0.391,0.877884,0.719131,0.706144,0.712578,0.796426
6,0.2768,0.833291,0.73327,0.722092,0.727638,0.807459
7,0.2168,0.843233,0.72787,0.727017,0.727443,0.806371
8,0.1808,0.852488,0.737462,0.734522,0.735989,0.811344
9,0.1605,0.85425,0.738465,0.735694,0.737077,0.814141
10,0.1554,0.853859,0.738342,0.735225,0.73678,0.814297


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]


Iteration: 29. Training using 120 samples


Some weights of BertForTokenClassification were not initialized from the model checkpoint at alexyalunin/RuBioBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy
1,3.4925,2.397412,0.373383,0.28424,0.32277,0.476457
2,1.5735,1.284257,0.650379,0.624296,0.637071,0.724476
3,0.7384,1.039538,0.702428,0.664869,0.683133,0.762238
4,0.4914,0.93532,0.721642,0.696764,0.708985,0.791919
5,0.3577,0.874988,0.713436,0.703565,0.708466,0.792852
6,0.2799,0.822922,0.734926,0.728893,0.731897,0.810723
7,0.1875,0.816159,0.748392,0.736632,0.742465,0.818803
8,0.1755,0.836832,0.743054,0.733818,0.738407,0.81554
9,0.1482,0.818281,0.752376,0.742495,0.747403,0.821756
10,0.1329,0.821469,0.751663,0.741792,0.746695,0.82129


Filter:   0%|          | 0/612 [00:00<?, ? examples/s]

VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▂▁▅▅▃▆▆▆▃▇▇▆▂▅▇▇▇▃█▇▇██▇▆████▆██▇▄██▇███
eval/f1,▁▁▄▄▃▅▆▆▃▆▇▆▁▄▇▇▇▂█▇▆██▇▆████▆██▇▃██▇███
eval/loss,▇█▅▅▆▄▃▃▆▂▂▃▆▄▂▂▂▆▁▂▃▁▁▁▃▁▁▁▁▃▁▁▂▅▁▁▂▁▁▁
eval/precision,▂▁▄▄▄▅▆▆▄▆▇▆▁▅▇▇▇▃█▇▆██▇▆████▆██▇▃██▇███
eval/recall,▁▁▃▃▂▅▆▆▂▆▇▆▁▄▇▇▇▂▇▇▆▇█▇▅███▇▆██▇▂██▇███
eval/runtime,▁▃▁▇▂▁▂█▁▂▂▂▁▂██▃▁▃▂█▂█▁▁▂▂▁▂▁▂▁▇▂▄▂▂▂▂▇
eval/samples_per_second,█▅▇▂▇▇▇▁▇▆▇▇▇▇▁▁▅█▆▇▁▇▁█▇▇▇▇▇▇▇▇▂▇▅▇▇▇▇▂
eval/steps_per_second,█▅▇▂▇▇▇▁▇▆▇▇▇▇▁▁▅█▆▇▁▇▁█▇▇▇▇▇▇▇▇▂▇▅▇▇▇▇▂
train/epoch,▆█▂▃▃▄▃▃▃▁█▇▆▄▃█▆▄▂█▅▃█▅▂▇▄▁▆▃▇▄█▅▂▆▂▇▃▇
train/global_step,▁▁▁▁▁▂▂▂▂▁▄▄▃▃▂▅▄▃▂▅▄▂▆▄▂▆▄▁▅▃▇▄█▅▂▆▃▇▃█

0,1
eval/accuracy,0.82129
eval/f1,0.74669
eval/loss,0.82147
eval/precision,0.75166
eval/recall,0.74179
eval/runtime,0.9154
eval/samples_per_second,84.114
eval/steps_per_second,21.848
train/epoch,10.0
train/global_step,300.0
