In [None]:
# For use in Google Colab: mount Google Drive and make the thesis folder the
# working directory (presumably so the local `modules` package imported by the
# following cell resolves -- confirm against the Drive layout).
from google.colab import drive
drive.mount('/content/drive')
import os
os.chdir('/content/drive/My Drive/Colab Notebooks/thesis/')

# Install the notebook's dependencies into the Colab runtime.
# NOTE(review): only estnltk is version-pinned; the other three packages are
# installed at whatever version is current when the cell runs.
!pip install estnltk==1.7.4
!pip install evaluate
!pip install seqeval
!pip install nervaluate

In [2]:
from modules.data_processing import DatasetProcessor
from modules.bert_data_processing import BERTDataProcessor
from modules.bert_evaluator import BERTEvaluator
from modules.bert_trainer import BERTTrainer
import json
# Module-level aliases for the label definitions that live on DatasetProcessor,
# so the training code below can refer to them without the class prefix.
# Presumably: the tag list, a tag -> index mapping and its inverse -- verify
# against modules/data_processing.py.
ALL_TAGS = DatasetProcessor.ALL_TAGS
TAG2IDX = DatasetProcessor.TAG2IDX
IDX2TAG = DatasetProcessor.IDX2TAG

INFO:datasets:PyTorch version 2.5.1+cu124 available.
INFO:datasets:Polars version 1.21.0 available.
INFO:datasets:Duckdb version 1.1.3 available.
INFO:datasets:TensorFlow version 2.18.0 available.
INFO:datasets:JAX version 0.4.33 available.


INFO:config.py:54: PyTorch version 2.5.1+cu124 available.
INFO:config.py:66: Polars version 1.21.0 available.
INFO:config.py:77: Duckdb version 1.1.3 available.
INFO:config.py:112: TensorFlow version 2.18.0 available.
INFO:config.py:125: JAX version 0.4.33 available.


In [6]:
# Dataset names accepted by train_model (compared case-insensitively).
_SUPPORTED_DATASETS = ('ewt', 'edt', 'combined')


def _model_short_name(model_name):
    """Return the segment after the first '/' of a model id, or the id itself if it has no '/'."""
    parts = model_name.split('/')
    return parts[1] if len(parts) > 1 else model_name


def _evaluate_and_save(evaluator, test_split, model_trainer, model_name, trained_on, evaluated_on, epochs):
    """Evaluate ``model_trainer`` on ``test_split``, persist the nervaluate scores, return the raw results."""
    results = evaluator.evaluate_and_print(test_split, model_trainer)
    evaluator.evaluation_to_json(
        # results[1] holds the overall nervaluate scores keyed by scheme and
        # results[2] the per-tag breakdown, judging by how they are passed on
        # here -- TODO confirm against BERTEvaluator.evaluate_and_print.
        nervaluate_strict_overall=results[1]['strict'],
        nervaluate_by_tag=results[2],
        model_name=_model_short_name(model_name),
        trained_on=trained_on,
        evaluated_on=evaluated_on,
        epochs=epochs,
    )
    return results


def train_model(model_name, dataset_name, epochs=3, batch_size=16, early_stop_patience=3):
    """Fine-tune ``model_name`` on one dataset and evaluate it on the matching test split.

    Args:
        model_name: Model identifier handed to BERTDataProcessor and BERTTrainer,
            e.g. ``"tartuNLP/EstBERT"``. The part after the first ``/`` (or the
            whole name when there is no ``/``) is used in the output directory
            and in the saved evaluation records.
        dataset_name: ``'ewt'``, ``'edt'`` or ``'combined'`` (case-insensitive).
            ``'combined'`` trains on both datasets merged with
            ``DatasetProcessor.combine_datasetdicts``.
        epochs: Number of training epochs passed to ``finetune_model``.
        batch_size: Batch size passed to ``finetune_model``.
        early_stop_patience: Early-stopping patience passed to ``finetune_model``.
            Defaults to 3, the value that was previously hard-coded.

    Returns:
        ``(model, model_trainer, results)``. For ``'combined'`` the third item
        is a tuple ``(combined_results, ewt_results, edt_results)``, because
        the model is additionally evaluated on each dataset's own test split.

    Raises:
        ValueError: If ``dataset_name`` is not one of the supported names.
    """
    dataset_key = dataset_name.lower()
    # Fail fast: previously an unknown name fell through both branches and only
    # crashed later on the unbound `dataset`, after printing "andmestik laetud".
    if dataset_key not in _SUPPORTED_DATASETS:
        raise ValueError(
            f'Unknown dataset_name {dataset_name!r}; expected one of {_SUPPORTED_DATASETS}'
        )
    is_combined = dataset_key == 'combined'

    if is_combined:
        ewt_processor = DatasetProcessor('ewt', from_json=True)
        edt_processor = DatasetProcessor('edt', from_json=True)
        ewt_dataset = DatasetProcessor.tag_to_id(ewt_processor.dataset, TAG2IDX)
        edt_dataset = DatasetProcessor.tag_to_id(edt_processor.dataset, TAG2IDX)
        dataset = DatasetProcessor.combine_datasetdicts(ewt_dataset, edt_dataset)
    else:
        processor = DatasetProcessor(dataset_key, from_json=True)
        dataset = DatasetProcessor.tag_to_id(processor.dataset, TAG2IDX)

    print(f'{dataset_name.upper()} andmestik laetud')
    bert_processor = BERTDataProcessor(model_name)
    evaluator = BERTEvaluator(all_tags=ALL_TAGS)

    tokenized_dataset = bert_processor.tokenize_dataset(dataset)

    trainer = BERTTrainer(model_name=model_name, idx2tag=IDX2TAG, tag2idx=TAG2IDX, evaluator=evaluator)

    # The output path keeps dataset_name exactly as the caller spelled it, so
    # existing result directories stay valid.
    model, model_trainer = trainer.finetune_model(
        processor=bert_processor,
        tokenized_dataset=tokenized_dataset,
        epochs=epochs,
        batch_size=batch_size,
        early_stop_patience=early_stop_patience,
        output_dir=f'./results/{_model_short_name(model_name)}/{dataset_name}/trained_for_{epochs}',
    )

    results = _evaluate_and_save(
        evaluator, tokenized_dataset['test'], model_trainer,
        model_name, trained_on=dataset_name, evaluated_on=dataset_name, epochs=epochs,
    )

    if is_combined:
        # Also score the combined model on each source dataset's own test split.
        tokenized_ewt = bert_processor.tokenize_dataset(ewt_dataset['test'])
        tokenized_edt = bert_processor.tokenize_dataset(edt_dataset['test'])

        print(f'Kombineeritud andmestikul treenitud {model_name} EWT testandmestikul')
        ewt_results = _evaluate_and_save(
            evaluator, tokenized_ewt, model_trainer,
            model_name, trained_on=dataset_name, evaluated_on="EWT", epochs=epochs,
        )

        print(f'Kombineeritud andmestikul treenitud {model_name} EDT testandmestikul')
        edt_results = _evaluate_and_save(
            evaluator, tokenized_edt, model_trainer,
            model_name, trained_on=dataset_name, evaluated_on="EDT", epochs=epochs,
        )

        return model, model_trainer, (results, ewt_results, edt_results)

    return model, model_trainer, results

def train_all(model_names=None, dataset_names=None, epochs=3):
    """Train every requested model on every requested dataset and collect the results.

    Args:
        model_names: Iterable of model identifiers. Defaults to
            ``["tartuNLP/EstRoBERTa", "tartuNLP/EstBERT"]``.
        dataset_names: Iterable of dataset names understood by ``train_model``.
            Defaults to ``['ewt', 'edt', 'combined']``.
        epochs: Number of epochs passed to each ``train_model`` call.

    Returns:
        Nested dict ``{model_name: {dataset_name: results}}`` where ``results``
        is the third value returned by ``train_model`` for that pair.
    """
    if model_names is None:
        model_names = ["tartuNLP/EstRoBERTa", "tartuNLP/EstBERT"]
    if dataset_names is None:
        dataset_names = ['ewt', 'edt', 'combined']
    # Materialise once: the dataset list is re-iterated for every model, which
    # would silently yield nothing on the second pass for a one-shot iterator.
    dataset_names = list(dataset_names)

    results_dict = {}
    for model_name in model_names:
        model_results = {}
        for dataset_name in dataset_names:
            # Only the evaluation results are kept; the model and trainer
            # objects returned alongside them are not needed here.
            _, _, results = train_model(model_name, dataset_name, epochs=epochs)
            model_results[dataset_name] = results
        results_dict[model_name] = model_results

    return results_dict

In [None]:
def main():
    """Run the complete training sweep via train_all(); the collected results are not returned."""
    train_all()

In [None]:
# Run the full sweep: every model/dataset pair listed in train_all() is trained
# and evaluated one after another.
main()

EWT andmestik laetud


tokenizer_config.json:   0%|          | 0.00/398 [00:00<?, ?B/s]

sentencepiece.bpe.model:   0%|          | 0.00/5.07M [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/17.1M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/239 [00:00<?, ?B/s]

Downloading builder script:   0%|          | 0.00/6.34k [00:00<?, ?B/s]

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

config.json:   0%|          | 0.00/707 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.11G [00:00<?, ?B/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 09:01:36] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number,Eve precision,Eve recall,Eve f1,Eve number
1,No log,0.242729,0.75924,0.715423,0.73668,0.958174,0.482759,0.583333,0.528302,24,0.0,0.0,0.0,7,0.266667,0.218182,0.24,55,0.958478,0.909688,0.933446,609,0.476027,0.449838,0.462562,309,0.0,0.0,0.0,1,,,,
2,0.149200,0.249776,0.798755,0.766169,0.782123,0.963294,0.46875,0.625,0.535714,24,0.0,0.0,0.0,7,0.633333,0.345455,0.447059,55,0.972556,0.931034,0.951342,609,0.541667,0.546926,0.544283,309,0.0,0.0,0.0,1,,,,
3,0.039500,0.288473,0.81509,0.763184,0.788284,0.96422,0.56,0.583333,0.571429,24,0.0,0.0,0.0,7,0.53125,0.309091,0.390805,55,0.949511,0.957307,0.953393,609,0.590734,0.495146,0.538732,309,0.0,0.0,0.0,1,0.0,0.0,0.0,0.0


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 09:06:50] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 313.23 sekundit (0.09 tundi)
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.5416666666666666, 'recall': 0.23636363636363636, 'f1': 0.32911392405063294, 'number': 55}
GEP {'precision': 0.7818181818181819, 'recall': 0.7166666666666667, 'f1': 0.7478260869565218, 'number': 60}
LOC {'precision': 0.3548387096774194, 'recall': 0.7096774193548387, 'f1': 0.4731182795698926, 'number': 62}
ORG {'precision': 0.49444444444444446, 'recall': 0.5144508670520231, 'f1': 0.5042492917847026, 'number': 173}
PER {'precision': 0.9494949494949495, 'recall': 0.7423494570582428, 'f1': 0.8332409972299168, 'number': 1013}
PROD {'precision': 0.26883910386965376, 'recall': 0.4258064516129032, 'f1': 0.3295880149812734, 'number': 310}
overall_precision 0.6440576230492197
overall_recall 0.6413628212791392
overall_f1 0.6427073974243785
overall_accuracy 0.9522528274352426

Nervaluate tulemused
Strict {'correct': 1073, 'incorrect': 399, 'partial': 0, 'missed': 201, 'spurious': 205, 'possible': 1673, 'actual': 1677, 'precision': 0.6398330351818724, 'recall': 

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 09:07:46] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0692,0.079022,0.720725,0.719843,0.720284,0.977724,0.643836,0.52809,0.580247,89,0.573034,0.795322,0.666122,513,0.862423,0.506024,0.637813,830,0.0,0.0,0.0,9,0.537572,0.709924,0.611842,393,0.84435,0.939502,0.889388,1686,0.491566,0.387097,0.433121,527,0.0,0.0,0.0,40
2,0.0395,0.078968,0.753602,0.742354,0.747935,0.978915,0.769231,0.674157,0.718563,89,0.538462,0.873294,0.666171,513,0.808621,0.56506,0.665248,830,0.0,0.0,0.0,9,0.656613,0.720102,0.686893,393,0.923586,0.910439,0.916965,1686,0.539503,0.45351,0.492784,527,0.0,0.0,0.0,40
3,0.0189,0.079573,0.767533,0.765843,0.766687,0.981285,0.662338,0.573034,0.614458,89,0.605381,0.789474,0.685279,513,0.793605,0.657831,0.719368,830,0.0,0.0,0.0,9,0.638132,0.834606,0.723264,393,0.946914,0.909846,0.92801,1686,0.521569,0.504744,0.513018,527,0.0,0.0,0.0,40


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 09:26:56] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 1150.49 sekundit (0.32 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5714285714285714, 'recall': 0.5052631578947369, 'f1': 0.5363128491620112, 'number': 95}
GEP {'precision': 0.7171717171717171, 'recall': 0.7553191489361702, 'f1': 0.7357512953367876, 'number': 470}
LOC {'precision': 0.7563884156729132, 'recall': 0.7104, 'f1': 0.7326732673267328, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.8014285714285714, 'recall': 0.7674418604651163, 'f1': 0.7840670859538784, 'number': 731}
PER {'precision': 0.9434878587196468, 'recall': 0.9340034965034965, 'f1': 0.9387217219415769, 'number': 2288}
PROD {'precision': 0.5830618892508144, 'recall': 0.5655608214849921, 'f1': 0.5741780272654371, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.822550052687039
overall_recall 0.8044105523495466
overall_f1 0.8133791809940606
overall_accuracy 0.98288659088577

Nervaluate tulemused
Strict {'correct': 3903, 'incorrect': 734, 'partial': 0, 'm

Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 09:27:53] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0774,0.122649,0.720629,0.720346,0.720487,0.972632,0.6,0.404494,0.483221,89,0.636893,0.610801,0.623574,537,0.769452,0.637993,0.697583,837,0.0,0.0,0.0,9,0.364113,0.774554,0.49536,448,0.933601,0.912854,0.923111,2295,0.525641,0.392344,0.449315,836,0.0,0.0,0.0,41
2,0.0402,0.110727,0.764647,0.748429,0.756451,0.97686,0.634409,0.662921,0.648352,89,0.600324,0.690875,0.642424,537,0.687351,0.688172,0.687761,837,0.0,0.0,0.0,9,0.636364,0.65625,0.646154,448,0.949053,0.917211,0.932861,2295,0.537748,0.485646,0.510371,836,0.0,0.0,0.0,41
3,0.0216,0.121331,0.776008,0.755892,0.765818,0.978289,0.7125,0.640449,0.674556,89,0.591353,0.789572,0.676236,537,0.79084,0.618877,0.69437,837,0.0,0.0,0.0,9,0.598513,0.71875,0.653144,448,0.943675,0.919826,0.931598,2295,0.568895,0.498804,0.531549,836,0.0,0.0,0.0,41


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 09:50:09] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 1336.07 sekundit (0.37 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.712, 'recall': 0.5933333333333334, 'f1': 0.6472727272727272, 'number': 150}
GEP {'precision': 0.6671974522292994, 'recall': 0.7905660377358491, 'f1': 0.7236614853195165, 'number': 530}
LOC {'precision': 0.716030534351145, 'recall': 0.6826783114992722, 'f1': 0.6989567809239939, 'number': 687}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7160356347438753, 'recall': 0.7112831858407079, 'f1': 0.713651498335183, 'number': 904}
PER {'precision': 0.9415501905972046, 'recall': 0.8979097243259618, 'f1': 0.9192122809737945, 'number': 3301}
PROD {'precision': 0.5110336817653891, 'recall': 0.46659597030752914, 'f1': 0.48780487804878053, 'number': 943}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7955661124307205
overall_recall 0.7699616858237548
overall_f1 0.7825545171339563
overall_accuracy 0.9783193629887721

Nervaluate tulemused
Strict {'correct': 5024, 'incorrect': 1029, 'partial': 0

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstRoBERTa EWT testandmestikul
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.7954545454545454, 'recall': 0.6363636363636364, 'f1': 0.7070707070707071, 'number': 55}
GEP {'precision': 0.7575757575757576, 'recall': 0.8333333333333334, 'f1': 0.7936507936507938, 'number': 60}
LOC {'precision': 0.3786407766990291, 'recall': 0.6290322580645161, 'f1': 0.4727272727272727, 'number': 62}
ORG {'precision': 0.5899280575539568, 'recall': 0.47398843930635837, 'f1': 0.5256410256410255, 'number': 173}
PER {'precision': 0.9439655172413793, 'recall': 0.8647581441263573, 'f1': 0.902627511591963, 'number': 1013}
PROD {'precision': 0.4027777777777778, 'recall': 0.3741935483870968, 'f1': 0.38795986622073586, 'number': 310}
overall_precision 0.764030612244898
overall_recall 0.7160789001793186
overall_f1 0.7392780006170935
overall_accuracy 0.9642466253192266

Nervaluate tulemused
Strict {'correct': 1198, 'incorrect': 231, 'partial': 0, 'missed': 244, 'spurious': 139, 'possible': 1673, 'actual': 1568, 'precision': 0.764030612244898, 'recall': 0.716

Seqeval tulemused
EVE {'precision': 0.6666666666666666, 'recall': 0.5684210526315789, 'f1': 0.6136363636363636, 'number': 95}
GEP {'precision': 0.6565836298932385, 'recall': 0.7851063829787234, 'f1': 0.7151162790697675, 'number': 470}
LOC {'precision': 0.7789855072463768, 'recall': 0.688, 'f1': 0.7306711979609176, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7391304347826086, 'recall': 0.7674418604651163, 'f1': 0.7530201342281879, 'number': 731}
PER {'precision': 0.9405405405405406, 'recall': 0.9125874125874126, 'f1': 0.9263531499556344, 'number': 2288}
PROD {'precision': 0.5654450261780105, 'recall': 0.5118483412322274, 'f1': 0.537313432835821, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.8059827259321677
overall_recall 0.7885408079142622
overall_f1 0.797166371497031
overall_accuracy 0.9818376677421929

Nervaluate tulemused
Strict {'correct': 3826, 'incorrect': 798, 'partial': 0, 'm

tokenizer_config.json:   0%|          | 0.00/62.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/534 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/410k [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

model.safetensors:   0%|          | 0.00/498M [00:00<?, ?B/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 09:51:30] Alustan tartuNLP/EstBERT treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,No log,0.255041,0.754506,0.780639,0.767351,0.950338,0.545455,0.461538,0.5,26,0.5,0.333333,0.4,9,0.512195,0.328125,0.4,64,0.924581,0.952518,0.938342,695,0.476316,0.546828,0.509142,331,0.0,0.0,0.0,1
2,0.168300,0.301402,0.787851,0.771758,0.779722,0.953875,0.521739,0.461538,0.489796,26,0.142857,0.111111,0.125,9,0.4,0.21875,0.282828,64,0.948454,0.926619,0.937409,695,0.551532,0.598187,0.573913,331,0.0,0.0,0.0,1
3,0.043100,0.324784,0.798174,0.776199,0.787033,0.955796,0.55,0.423077,0.478261,26,0.25,0.333333,0.285714,9,0.407407,0.34375,0.372881,64,0.941776,0.930935,0.936324,695,0.593168,0.577039,0.584992,331,0.0,0.0,0.0,1


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 09:55:02] tartuNLP/EstBERT treenimine lõpetatud
Kokku kulus: 212.08 sekundit (0.06 tundi)
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.24324324324324326, 'recall': 0.15789473684210525, 'f1': 0.19148936170212766, 'number': 57}
GEP {'precision': 0.66, 'recall': 0.6, 'f1': 0.6285714285714286, 'number': 55}
LOC {'precision': 0.17647058823529413, 'recall': 0.6545454545454545, 'f1': 0.277992277992278, 'number': 55}
ORG {'precision': 0.5222222222222223, 'recall': 0.4069264069264069, 'f1': 0.45742092457420924, 'number': 231}
PER {'precision': 0.9308108108108109, 'recall': 0.7863013698630137, 'f1': 0.8524752475247525, 'number': 1095}
PROD {'precision': 0.30612244897959184, 'recall': 0.3314917127071823, 'f1': 0.31830238726790455, 'number': 362}
overall_precision 0.6448545861297539
overall_recall 0.6215633423180593
overall_f1 0.6329947845182542
overall_accuracy 0.9369323050556984

Nervaluate tulemused
Strict {'correct': 1153, 'incorrect': 421, 'partial': 0, 'missed': 281, 'spurious': 233, 'possible': 1855, 'actual': 1807, 'precision': 0.6380741560597676, 'recall': 0.6215633423180593, 'f1': 0

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 09:55:37] Alustan tartuNLP/EstBERT treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.085,0.1026,0.7109,0.696954,0.703858,0.968893,0.344444,0.455882,0.392405,68,0.612963,0.78066,0.686722,424,0.778509,0.558176,0.650183,636,0.0,0.0,0.0,12,0.55707,0.720264,0.628242,454,0.891975,0.888138,0.890052,1627,0.417822,0.362543,0.388224,582,0.0,0.0,0.0,71
2,0.0416,0.11563,0.685544,0.712442,0.698734,0.968683,0.441176,0.441176,0.441176,68,0.546667,0.870283,0.67152,424,0.789604,0.501572,0.613462,636,0.0,0.0,0.0,12,0.490057,0.759912,0.595855,454,0.924952,0.886294,0.90521,1627,0.413961,0.438144,0.42571,582,0.0,0.0,0.0,71
3,0.0165,0.129063,0.71119,0.720186,0.71566,0.970313,0.368421,0.411765,0.388889,68,0.577818,0.761792,0.657172,424,0.740602,0.619497,0.674658,636,0.0,0.0,0.0,12,0.533742,0.76652,0.629295,454,0.941022,0.882606,0.910879,1627,0.451557,0.448454,0.45,582,0.0,0.0,0.0,71


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 10:07:35] tartuNLP/EstBERT treenimine lõpetatud
Kokku kulus: 718.25 sekundit (0.20 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.45614035087719296, 'recall': 0.30952380952380953, 'f1': 0.36879432624113473, 'number': 84}
GEP {'precision': 0.6786570743405276, 'recall': 0.7369791666666666, 'f1': 0.7066167290886392, 'number': 384}
LOC {'precision': 0.7612293144208038, 'recall': 0.7301587301587301, 'f1': 0.7453703703703703, 'number': 441}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.6867924528301886, 'recall': 0.7489711934156379, 'f1': 0.7165354330708662, 'number': 729}
PER {'precision': 0.9394347240915208, 'recall': 0.8998710786420283, 'f1': 0.9192273924495171, 'number': 2327}
PROD {'precision': 0.47641509433962265, 'recall': 0.5135593220338983, 'f1': 0.4942903752039152, 'number': 590}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7842879087118718
overall_recall 0.7832566294104756
overall_f1 0.7837719298245613
overall_accuracy 0.9752186817846318

Nervaluate tulemused
Strict {'correct': 3574, 'incorrect': 75

Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 10:08:19] Alustan tartuNLP/EstBERT treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0949,0.143808,0.7109,0.69,0.700294,0.965007,0.338462,0.323529,0.330827,68,0.577703,0.76,0.65643,450,0.752252,0.517829,0.613407,645,0.0,0.0,0.0,12,0.477301,0.750965,0.583646,518,0.927103,0.854436,0.889287,2322,0.475533,0.415115,0.443275,913,0.0,0.0,0.0,72
2,0.04,0.156549,0.729516,0.7212,0.725334,0.966941,0.383721,0.485294,0.428571,68,0.615385,0.64,0.627451,450,0.66369,0.691473,0.677297,645,0.0,0.0,0.0,12,0.547967,0.650579,0.594881,518,0.935425,0.885874,0.909976,2322,0.492802,0.487404,0.490088,913,0.0,0.0,0.0,72
3,0.02,0.181128,0.742904,0.7224,0.732509,0.968194,0.352941,0.352941,0.352941,68,0.589438,0.768889,0.66731,450,0.718447,0.573643,0.637931,645,0.0,0.0,0.0,12,0.569678,0.718147,0.635354,518,0.937187,0.886736,0.911264,2322,0.524376,0.483023,0.502851,913,0.0,0.0,0.0,72


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 10:23:11] tartuNLP/EstBERT treenimine lõpetatud
Kokku kulus: 891.59 sekundit (0.25 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5565217391304348, 'recall': 0.45390070921985815, 'f1': 0.4999999999999999, 'number': 141}
GEP {'precision': 0.5662650602409639, 'recall': 0.7494305239179955, 'f1': 0.6450980392156863, 'number': 439}
LOC {'precision': 0.736734693877551, 'recall': 0.7278225806451613, 'f1': 0.7322515212981744, 'number': 496}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.738015607580825, 'recall': 0.6895833333333333, 'f1': 0.7129779213785676, 'number': 960}
PER {'precision': 0.9386617100371747, 'recall': 0.8854471069549971, 'f1': 0.9112781954887217, 'number': 3422}
PROD {'precision': 0.4939759036144578, 'recall': 0.4737394957983193, 'f1': 0.48364611260053614, 'number': 952}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.786793059125964
overall_recall 0.7630102835774385
overall_f1 0.7747191900015821
overall_accuracy 0.9704860683402725

Nervaluate tulemused
Strict {'correct': 4897, 'incorrect': 954, '

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstBERT EWT testandmestikul
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.5517241379310345, 'recall': 0.5614035087719298, 'f1': 0.5565217391304348, 'number': 57}
GEP {'precision': 0.2631578947368421, 'recall': 0.7272727272727273, 'f1': 0.3864734299516908, 'number': 55}
LOC {'precision': 0.4864864864864865, 'recall': 0.6545454545454545, 'f1': 0.5581395348837209, 'number': 55}
ORG {'precision': 0.7235294117647059, 'recall': 0.5324675324675324, 'f1': 0.6134663341645885, 'number': 231}
PER {'precision': 0.9608879492600423, 'recall': 0.8301369863013699, 'f1': 0.8907398334149927, 'number': 1095}
PROD {'precision': 0.5, 'recall': 0.34806629834254144, 'f1': 0.41042345276872966, 'number': 362}
overall_precision 0.7663438256658596
overall_recall 0.6824797843665769
overall_f1 0.7219846022241232
overall_accuracy 0.9505855469865753

Nervaluate tulemused
Strict {'correct': 1266, 'incorrect': 260, 'partial': 0, 'missed': 329, 'spurious': 137, 'possible': 1855, 'actual': 1663, 'precision': 0.7612748045700541, 'recall': 0.682479784366576

Seqeval tulemused
EVE {'precision': 0.5614035087719298, 'recall': 0.38095238095238093, 'f1': 0.45390070921985815, 'number': 84}
GEP {'precision': 0.6736596736596736, 'recall': 0.7526041666666666, 'f1': 0.7109471094710947, 'number': 384}
LOC {'precision': 0.78125, 'recall': 0.7369614512471655, 'f1': 0.7584597432905484, 'number': 441}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7414030261348006, 'recall': 0.7393689986282579, 'f1': 0.7403846153846154, 'number': 729}
PER {'precision': 0.9294478527607362, 'recall': 0.9114740008594757, 'f1': 0.9203731829030157, 'number': 2327}
PROD {'precision': 0.491679273827534, 'recall': 0.5508474576271186, 'f1': 0.5195843325339727, 'number': 590}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7941819772528433
overall_recall 0.7957484111330265
overall_f1 0.7949644225506294
overall_accuracy 0.9759567818835686

Nervaluate tulemused
Strict {'correct': 3631, 'incorrect': 694, 'partial': 

In [None]:
# Separate run: EstRoBERTa on EDT only, for 6 epochs instead of the 3 used by train_all().
estroberta_edt, estroberta_edt_trainer, estroberta_edt_results = train_model('tartuNLP/EstRoBERTa', 'edt', epochs=6)

EDT andmestik laetud


Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 10:25:44] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0782,0.085064,0.725127,0.699046,0.711848,0.976293,0.517857,0.325843,0.4,89,0.597134,0.730994,0.657318,513,0.790991,0.528916,0.633935,830,0.0,0.0,0.0,9,0.534636,0.765903,0.629707,393,0.870056,0.913405,0.891204,1686,0.470109,0.328273,0.386592,527,0.0,0.0,0.0,40
2,0.0476,0.087196,0.715017,0.717641,0.716327,0.976666,0.5,0.438202,0.467066,89,0.570461,0.820663,0.673062,513,0.793907,0.533735,0.638329,830,0.0,0.0,0.0,9,0.548043,0.783715,0.645026,393,0.885313,0.89739,0.891311,1686,0.45733,0.396584,0.424797,527,0.0,0.0,0.0,40
3,0.0311,0.091934,0.7257,0.728897,0.727295,0.978049,0.545455,0.47191,0.506024,89,0.56827,0.851852,0.681747,513,0.832402,0.538554,0.653987,830,0.0,0.0,0.0,9,0.545283,0.735369,0.626219,393,0.914442,0.893832,0.904019,1686,0.472426,0.487666,0.479925,527,0.0,0.0,0.0,40
4,0.0194,0.101696,0.741753,0.737216,0.739477,0.978903,0.603175,0.426966,0.5,89,0.56147,0.863548,0.680492,513,0.78754,0.593976,0.677198,830,0.0,0.0,0.0,9,0.614894,0.735369,0.669757,393,0.909635,0.901542,0.90557,1686,0.519187,0.436433,0.474227,527,0.0,0.0,0.0,40
5,0.0098,0.121099,0.739312,0.736237,0.737771,0.978446,0.592105,0.505618,0.545455,89,0.557464,0.822612,0.664567,513,0.8,0.636145,0.708725,830,0.0,0.0,0.0,9,0.534602,0.78626,0.636457,393,0.938452,0.877224,0.906806,1686,0.534279,0.428843,0.475789,527,0.0,0.0,0.0,40
6,0.0046,0.125276,0.761704,0.752386,0.757016,0.97942,0.561798,0.561798,0.561798,89,0.602374,0.791423,0.684078,513,0.802053,0.659036,0.723545,830,0.0,0.0,0.0,9,0.601179,0.778626,0.678492,393,0.936914,0.88968,0.912686,1686,0.551867,0.504744,0.527255,527,0.0,0.0,0.0,40


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 11:03:30] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 2265.46 sekundit (0.63 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5365853658536586, 'recall': 0.4631578947368421, 'f1': 0.4971751412429378, 'number': 95}
GEP {'precision': 0.6844262295081968, 'recall': 0.7106382978723405, 'f1': 0.6972860125260961, 'number': 470}
LOC {'precision': 0.7062818336162988, 'recall': 0.6656, 'f1': 0.685337726523888, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7357237715803453, 'recall': 0.7578659370725034, 'f1': 0.7466307277628031, 'number': 731}
PER {'precision': 0.9356855739169272, 'recall': 0.9156468531468531, 'f1': 0.9255577645239673, 'number': 2288}
PROD {'precision': 0.5988805970149254, 'recall': 0.5071090047393365, 'f1': 0.5491873396065012, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.8025586353944563
overall_recall 0.7757625721352019
overall_f1 0.7889331377069796
overall_accuracy 0.9809939686919245

Nervaluate tulemused
Strict {'correct': 3764, 'incorrect': 829, 'partial': 0, 

In [None]:
# Train tartuNLP/EstRoBERTa on the combined (EWT + EDT) dataset for 6 epochs
# and keep the three values train_model returns under run-specific names.
(
    estroberta_combined,
    estroberta_combined_trainer,
    estroberta_combined_results,
) = train_model(
    model_name='tartuNLP/EstRoBERTa',
    dataset_name='combined',
    epochs=6,
)

COMBINED andmestik laetud


Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 11:04:51] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0822,0.142245,0.677787,0.666339,0.672014,0.967388,0.45,0.404494,0.426036,89,0.624719,0.517691,0.566191,537,0.749648,0.636798,0.68863,837,0.0,0.0,0.0,9,0.294913,0.828125,0.434936,448,0.950509,0.853595,0.899449,2295,0.478936,0.258373,0.335664,836,0.0,0.0,0.0,41
2,0.0474,0.113163,0.729031,0.747643,0.73822,0.975219,0.517544,0.662921,0.581281,89,0.611584,0.668529,0.63879,537,0.647059,0.709677,0.676923,837,0.0,0.0,0.0,9,0.612335,0.620536,0.616408,448,0.940163,0.903704,0.921573,2295,0.469777,0.529904,0.498033,836,0.0,0.0,0.0,41
3,0.0316,0.129303,0.766193,0.76198,0.76408,0.976759,0.417808,0.685393,0.519149,89,0.658318,0.685289,0.671533,537,0.739905,0.744325,0.742108,837,0.0,0.0,0.0,9,0.662736,0.627232,0.644495,448,0.942896,0.913725,0.928081,2295,0.517837,0.538278,0.527859,836,0.0,0.0,0.0,41
4,0.019,0.144214,0.784745,0.749607,0.766774,0.978007,0.564356,0.640449,0.6,89,0.587755,0.804469,0.679245,537,0.789238,0.630824,0.701195,837,0.0,0.0,0.0,9,0.653153,0.647321,0.650224,448,0.929103,0.925054,0.927074,2295,0.615262,0.462919,0.528328,836,0.0,0.0,0.0,41
5,0.0091,0.150025,0.766192,0.750393,0.75821,0.97695,0.47541,0.651685,0.549763,89,0.572207,0.782123,0.660897,537,0.741497,0.651135,0.693384,837,0.0,0.0,0.0,9,0.644105,0.658482,0.651214,448,0.936805,0.917211,0.926904,2295,0.577649,0.476077,0.521967,836,0.0,0.0,0.0,41
6,0.0044,0.159191,0.773878,0.762176,0.767983,0.977886,0.654321,0.595506,0.623529,89,0.599424,0.774674,0.675873,537,0.763869,0.641577,0.697403,837,0.0,0.0,0.0,9,0.607843,0.691964,0.647182,448,0.939582,0.921569,0.930488,2295,0.582147,0.538278,0.559354,836,0.0,0.0,0.0,41


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 11:50:26] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 2735.07 sekundit (0.76 tundi)
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.5546218487394958, 'recall': 0.44, 'f1': 0.49070631970260226, 'number': 150}
GEP {'precision': 0.7198581560283688, 'recall': 0.7660377358490567, 'f1': 0.7422303473491774, 'number': 530}
LOC {'precision': 0.7027439024390244, 'recall': 0.6710334788937409, 'f1': 0.6865227103499627, 'number': 687}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7159450897571278, 'recall': 0.75, 'f1': 0.7325769854132902, 'number': 904}
PER {'precision': 0.9506212169480727, 'recall': 0.9039684943956376, 'f1': 0.9267080745341614, 'number': 3301}
PROD {'precision': 0.5172031076581576, 'recall': 0.4941675503711559, 'f1': 0.5054229934924077, 'number': 943}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7977616645649432
overall_recall 0.775632183908046
overall_f1 0.786541300800373
overall_accuracy 0.9782463949214225

Nervaluate tulemused
Strict {'correct': 5061, 'incorrect': 1017, 'partial': 0, 'missed': 447,

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstRoBERTa EWT testandmestikul
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.725, 'recall': 0.5272727272727272, 'f1': 0.6105263157894736, 'number': 55}
GEP {'precision': 0.7692307692307693, 'recall': 0.8333333333333334, 'f1': 0.8, 'number': 60}
LOC {'precision': 0.4482758620689655, 'recall': 0.6290322580645161, 'f1': 0.523489932885906, 'number': 62}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
ORG {'precision': 0.5084745762711864, 'recall': 0.5202312138728323, 'f1': 0.5142857142857143, 'number': 173}
PER {'precision': 0.9600456621004566, 'recall': 0.8302073050345509, 'f1': 0.8904182106934887, 'number': 1013}
PROD {'precision': 0.364741641337386, 'recall': 0.3870967741935484, 'f1': 0.37558685446009393, 'number': 310}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
overall_precision 0.7380050505050505
overall_recall 0.698744769874477
overall_f1 0.7178385016886706
overall_accuracy 0.9609631521342575

Nervaluate tulemused
Strict {'correct': 1169, 'incorrect': 272, 'partial': 0, 'missed': 232, 'spu

Seqeval tulemused
EVE {'precision': 0.46835443037974683, 'recall': 0.3894736842105263, 'f1': 0.4252873563218391, 'number': 95}
GEP {'precision': 0.7134268537074149, 'recall': 0.7574468085106383, 'f1': 0.7347781217750258, 'number': 470}
LOC {'precision': 0.7416520210896309, 'recall': 0.6752, 'f1': 0.7068676716917922, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7636363636363637, 'recall': 0.8043775649794802, 'f1': 0.7834776815456362, 'number': 731}
PER {'precision': 0.9469730446310207, 'recall': 0.9366258741258742, 'f1': 0.9417710393320149, 'number': 2288}
PROD {'precision': 0.6048951048951049, 'recall': 0.5466034755134281, 'f1': 0.5742738589211619, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.8176470588235294
overall_recall 0.8021434460016488
overall_f1 0.8098210570120682
overall_accuracy 0.9825673534072901

Nervaluate tulemused
Strict {'correct': 3892, 'incorrect': 745, 'partial': 0

In [None]:
# Train tartuNLP/EstBERT on the combined (EWT + EDT) dataset for 6 epochs
# and keep the three values train_model returns under run-specific names.
(
    estbert_combined,
    estbert_combined_trainer,
    estbert_combined_results,
) = train_model(
    model_name='tartuNLP/EstBERT',
    dataset_name='combined',
    epochs=6,
)

COMBINED andmestik laetud


Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-05 11:52:02] Alustan tartuNLP/EstBERT treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0944,0.137863,0.719613,0.6986,0.708951,0.965501,0.32,0.352941,0.335664,68,0.613074,0.771111,0.683071,450,0.746204,0.533333,0.622061,645,0.0,0.0,0.0,12,0.462275,0.745174,0.570584,518,0.935335,0.872093,0.902608,2322,0.488032,0.401972,0.440841,913,0.0,0.0,0.0,72
2,0.0438,0.159691,0.723536,0.7218,0.722667,0.966474,0.28,0.514706,0.362694,68,0.613883,0.628889,0.621295,450,0.669207,0.68062,0.674865,645,0.0,0.0,0.0,12,0.498603,0.689189,0.578606,518,0.943104,0.892334,0.917017,2322,0.507803,0.463308,0.484536,913,0.0,0.0,0.0,72
3,0.0231,0.175934,0.737744,0.7404,0.73907,0.968061,0.409639,0.5,0.450331,68,0.569748,0.753333,0.648804,450,0.730263,0.688372,0.708699,645,0.0,0.0,0.0,12,0.592466,0.667954,0.627949,518,0.942831,0.894918,0.91825,2322,0.500543,0.504929,0.502726,913,0.0,0.0,0.0,72
4,0.0119,0.210472,0.751138,0.7262,0.738458,0.968621,0.4,0.382353,0.390977,68,0.594982,0.737778,0.65873,450,0.76556,0.572093,0.654836,645,0.0,0.0,0.0,12,0.518414,0.706564,0.598039,518,0.939636,0.911714,0.925464,2322,0.555409,0.461117,0.50389,913,0.0,0.0,0.0,72
5,0.0057,0.209417,0.763989,0.74,0.751803,0.970315,0.430769,0.411765,0.421053,68,0.617308,0.713333,0.661856,450,0.726957,0.648062,0.685246,645,0.0,0.0,0.0,12,0.612069,0.685328,0.64663,518,0.933042,0.918174,0.925548,2322,0.551298,0.488499,0.518002,913,0.0,0.0,0.0,72
6,0.0022,0.227933,0.749541,0.735,0.742199,0.969128,0.387097,0.352941,0.369231,68,0.604779,0.731111,0.661972,450,0.739962,0.6,0.662671,645,0.0,0.0,0.0,12,0.561562,0.722008,0.631757,518,0.944942,0.90913,0.92669,2322,0.51963,0.492881,0.505902,913,0.0,0.0,0.0,72


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-05 12:21:16] tartuNLP/EstBERT treenimine lõpetatud
Kokku kulus: 1754.47 sekundit (0.49 tundi)
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.5267857142857143, 'recall': 0.41843971631205673, 'f1': 0.466403162055336, 'number': 141}
GEP {'precision': 0.691764705882353, 'recall': 0.6697038724373576, 'f1': 0.6805555555555555, 'number': 439}
LOC {'precision': 0.6602112676056338, 'recall': 0.7560483870967742, 'f1': 0.7048872180451128, 'number': 496}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7386877828054299, 'recall': 0.6802083333333333, 'f1': 0.70824295010846, 'number': 960}
PER {'precision': 0.9336594313665546, 'recall': 0.8924605493863238, 'f1': 0.912595248767369, 'number': 3422}
PROD {'precision': 0.46382978723404256, 'recall': 0.4579831932773109, 'f1': 0.4608879492600423, 'number': 952}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7836229086229086
overall_recall 0.7589591773138049
overall_f1 0.7710938736742124
overall_accuracy 0.9699687122761204

Nervaluate tulemused
Strict {'correct': 4871, 'incorrect': 1003, 'p

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstBERT EWT testandmestikul
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.559322033898305, 'recall': 0.5789473684210527, 'f1': 0.5689655172413793, 'number': 57}
GEP {'precision': 0.5797101449275363, 'recall': 0.7272727272727273, 'f1': 0.6451612903225806, 'number': 55}
LOC {'precision': 0.40476190476190477, 'recall': 0.6181818181818182, 'f1': 0.48920863309352525, 'number': 55}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
ORG {'precision': 0.7668711656441718, 'recall': 0.5411255411255411, 'f1': 0.6345177664974619, 'number': 231}
PER {'precision': 0.9613428280773143, 'recall': 0.863013698630137, 'f1': 0.9095283926852743, 'number': 1095}
PROD {'precision': 0.39862542955326463, 'recall': 0.32044198895027626, 'f1': 0.3552833078101072, 'number': 362}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
overall_precision 0.7798552472858866
overall_recall 0.6970350404312669
overall_f1 0.7361229718189582
overall_accuracy 0.9520137103684662

Nervaluate tulemused
Strict {'correct': 1293, 'incorrect': 237, '

Seqeval tulemused
EVE {'precision': 0.49056603773584906, 'recall': 0.30952380952380953, 'f1': 0.3795620437956205, 'number': 84}
GEP {'precision': 0.7134831460674157, 'recall': 0.6614583333333334, 'f1': 0.6864864864864865, 'number': 384}
LOC {'precision': 0.7045454545454546, 'recall': 0.7732426303854876, 'f1': 0.7372972972972973, 'number': 441}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7323162274618585, 'recall': 0.7242798353909465, 'f1': 0.7282758620689657, 'number': 729}
PER {'precision': 0.9217657342657343, 'recall': 0.9063171465406102, 'f1': 0.9139761646803901, 'number': 2327}
PROD {'precision': 0.4930662557781202, 'recall': 0.5423728813559322, 'f1': 0.5165456012913641, 'number': 590}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7849934181658622
overall_recall 0.7841332456717072
overall_f1 0.7845630961517377
overall_accuracy 0.974904596636148

Nervaluate tulemused
Strict {'correct': 3578, 'incorrect': 766, 

Uuesti treenitavad mudelid: EstRoBERTa (EDT, 3 ja 6 epohhi; combined, 3 ja 6 epohhi) ja EstBERT (combined, 3 ja 6 epohhi). Põhjus: varasematel käivitustel oli output_dir sama, mistõttu jäi alles ainult üks parim variant.

In [7]:
# Train tartuNLP/EstRoBERTa on the EDT dataset for 3 epochs; the dataset name
# is lower-cased inside train_model, so 'EDT' selects the 'edt' branch.
(
    estroberta_edt_3,
    estroberta_edt_3_trainer,
    estroberta_edt_3_results,
) = train_model(
    model_name='tartuNLP/EstRoBERTa',
    dataset_name='EDT',
    epochs=3,
)

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

EDT andmestik laetud


Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-10 14:11:47] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0723,0.078209,0.725092,0.724737,0.724914,0.97753,0.560976,0.516854,0.538012,89,0.60315,0.746589,0.667247,513,0.795764,0.633735,0.705567,830,0.0,0.0,0.0,9,0.584677,0.737913,0.652418,393,0.841878,0.925267,0.881605,1686,0.438547,0.297913,0.354802,527,0.0,0.0,0.0,40
2,0.0417,0.086422,0.709577,0.726939,0.718153,0.976892,0.375,0.269663,0.313725,89,0.533578,0.851852,0.656156,513,0.831418,0.522892,0.642012,830,0.0,0.0,0.0,9,0.490879,0.753181,0.594378,393,0.897674,0.915777,0.906635,1686,0.514161,0.447818,0.478702,527,0.0,0.0,0.0,40
3,0.0212,0.086889,0.758995,0.753609,0.756292,0.97996,0.582418,0.595506,0.588889,89,0.582849,0.781676,0.667777,513,0.803807,0.661446,0.725711,830,0.0,0.0,0.0,9,0.643923,0.768448,0.700696,393,0.922007,0.904508,0.913174,1686,0.528541,0.474383,0.5,527,0.0,0.0,0.0,40


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-10 14:29:53] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 1085.24 sekundit (0.30 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5797101449275363, 'recall': 0.42105263157894735, 'f1': 0.48780487804878053, 'number': 95}
GEP {'precision': 0.6808510638297872, 'recall': 0.7505330490405118, 'f1': 0.7139959432048683, 'number': 469}
LOC {'precision': 0.729776247848537, 'recall': 0.6784, 'f1': 0.703150912106136, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7463672391017173, 'recall': 0.7729138166894665, 'f1': 0.7594086021505375, 'number': 731}
PER {'precision': 0.9239130434782609, 'recall': 0.9287587412587412, 'f1': 0.9263295553618135, 'number': 2288}
PROD {'precision': 0.5315985130111525, 'recall': 0.4518167456556082, 'f1': 0.488471391972673, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7963040739185216
overall_recall 0.7816944959802102
overall_f1 0.7889316550504526
overall_accuracy 0.9812886968221571

Nervaluate tulemused
Strict {'correct': 3792, 'incorrect': 827, 'partial': 0, 

In [8]:
# Train tartuNLP/EstRoBERTa on the EDT dataset for 6 epochs; the dataset name
# is lower-cased inside train_model, so 'EDT' selects the 'edt' branch.
(
    estroberta_edt_6,
    estroberta_edt_6_trainer,
    estroberta_edt_6_results,
) = train_model(
    model_name='tartuNLP/EstRoBERTa',
    dataset_name='EDT',
    epochs=6,
)

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

EDT andmestik laetud


Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-10 14:31:10] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0726,0.074083,0.740477,0.737216,0.738843,0.978119,0.628205,0.550562,0.586826,89,0.610738,0.709552,0.656447,513,0.833333,0.63253,0.719178,830,0.0,0.0,0.0,9,0.607143,0.778626,0.682274,393,0.871837,0.940095,0.90468,1686,0.41535,0.349146,0.379381,527,0.0,0.0,0.0,40
2,0.0472,0.076375,0.732493,0.739662,0.73606,0.978312,0.54902,0.314607,0.4,89,0.564537,0.844055,0.676562,513,0.806838,0.568675,0.667138,830,0.0,0.0,0.0,9,0.601578,0.776081,0.677778,393,0.897583,0.925267,0.911215,1686,0.469729,0.426945,0.447316,527,0.0,0.0,0.0,40
3,0.0295,0.088824,0.731725,0.734769,0.733244,0.978757,0.640625,0.460674,0.535948,89,0.570068,0.816764,0.671474,513,0.763441,0.598795,0.671168,830,0.0,0.0,0.0,9,0.555556,0.737913,0.63388,393,0.905771,0.912218,0.908983,1686,0.502304,0.413662,0.453694,527,0.0,0.0,0.0,40
4,0.0183,0.094191,0.755672,0.74162,0.74858,0.980032,0.655738,0.449438,0.533333,89,0.558559,0.846004,0.672868,513,0.804207,0.598795,0.686464,830,0.0,0.0,0.0,9,0.65,0.694656,0.671587,393,0.90388,0.92586,0.914738,1686,0.560794,0.428843,0.486022,527,0.0,0.0,0.0,40
5,0.0084,0.10957,0.746128,0.754343,0.750213,0.979478,0.617021,0.651685,0.63388,89,0.583679,0.822612,0.682848,513,0.795918,0.610843,0.691207,830,0.0,0.0,0.0,9,0.557223,0.755725,0.641469,393,0.933658,0.909846,0.921598,1686,0.537525,0.502846,0.519608,527,0.0,0.0,0.0,40
6,0.0039,0.115811,0.7608,0.754098,0.757434,0.979887,0.648352,0.662921,0.655556,89,0.594993,0.787524,0.677852,513,0.774854,0.638554,0.700132,830,0.0,0.0,0.0,9,0.606122,0.755725,0.672707,393,0.92503,0.907473,0.916168,1686,0.595455,0.497154,0.541882,527,0.0,0.0,0.0,40


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-10 15:07:42] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 2192.37 sekundit (0.61 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5540540540540541, 'recall': 0.43157894736842106, 'f1': 0.485207100591716, 'number': 95}
GEP {'precision': 0.6802443991853361, 'recall': 0.7121535181236673, 'f1': 0.6958333333333333, 'number': 469}
LOC {'precision': 0.6961414790996785, 'recall': 0.6928, 'f1': 0.6944667201283079, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7791495198902606, 'recall': 0.7770177838577291, 'f1': 0.7780821917808218, 'number': 731}
PER {'precision': 0.9322409211691762, 'recall': 0.9200174825174825, 'f1': 0.9260888693356797, 'number': 2288}
PROD {'precision': 0.6091743119266055, 'recall': 0.5244865718799369, 'f1': 0.5636672325976231, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.8080101716465353
overall_recall 0.7860235003092146
overall_f1 0.7968652037617555
overall_accuracy 0.981425525364591

Nervaluate tulemused
Strict {'correct': 3813, 'incorrect': 789, 'partial': 0, 

In [16]:
# Train tartuNLP/EstRoBERTa on the combined (EWT + EDT) dataset for 3 epochs;
# train_model lower-cases the dataset name, so 'Combined' is accepted.
(
    estroberta_combined_3,
    estroberta_combined_3_trainer,
    estroberta_combined_3_results,
) = train_model(
    model_name='tartuNLP/EstRoBERTa',
    dataset_name='Combined',
    epochs=3,
)

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

COMBINED andmestik laetud


Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-10 15:09:30] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0781,0.112341,0.723204,0.707581,0.715307,0.972621,0.618182,0.382022,0.472222,89,0.632,0.588454,0.60945,537,0.684337,0.678614,0.681464,837,0.0,0.0,0.0,9,0.387996,0.808036,0.524258,448,0.933451,0.922876,0.928133,2295,0.518987,0.245215,0.333063,836,0.0,0.0,0.0,41
2,0.0388,0.11506,0.767008,0.750589,0.75871,0.976869,0.710526,0.606742,0.654545,89,0.597504,0.713222,0.650255,537,0.690276,0.686977,0.688623,837,0.0,0.0,0.0,9,0.693431,0.636161,0.663562,448,0.925749,0.928976,0.92736,2295,0.546592,0.470096,0.505466,836,0.0,0.0,0.0,41
3,0.0212,0.126067,0.770531,0.751767,0.761034,0.977715,0.630435,0.651685,0.640884,89,0.57708,0.787709,0.666142,537,0.796446,0.589008,0.677198,837,0.0,0.0,0.0,9,0.563869,0.689732,0.620482,448,0.943505,0.924183,0.933744,2295,0.582418,0.507177,0.542199,836,0.0,0.0,0.0,41


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-10 15:31:50] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 1340.73 sekundit (0.37 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.6590909090909091, 'recall': 0.58, 'f1': 0.6170212765957446, 'number': 150}
GEP {'precision': 0.6960629921259842, 'recall': 0.8339622641509434, 'f1': 0.7587982832618025, 'number': 530}
LOC {'precision': 0.7658536585365854, 'recall': 0.6855895196506551, 'f1': 0.7235023041474654, 'number': 687}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.724972497249725, 'recall': 0.7289823008849557, 'f1': 0.7269718698290126, 'number': 904}
PER {'precision': 0.945997458703939, 'recall': 0.9021508633747349, 'f1': 0.9235540393859513, 'number': 3301}
PROD {'precision': 0.5361653272101033, 'recall': 0.49522799575821846, 'f1': 0.5148842337375964, 'number': 943}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.8088748019017432
overall_recall 0.7822222222222223
overall_f1 0.7953252824308531
overall_accuracy 0.9789483285447166

Nervaluate tulemused
Strict {'correct': 5104, 'incorrect': 981, 'partial': 0, '

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstRoBERTa EWT testandmestikul
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.813953488372093, 'recall': 0.6363636363636364, 'f1': 0.7142857142857143, 'number': 55}
GEP {'precision': 0.6790123456790124, 'recall': 0.9166666666666666, 'f1': 0.7801418439716312, 'number': 60}
LOC {'precision': 0.4943820224719101, 'recall': 0.7096774193548387, 'f1': 0.5827814569536423, 'number': 62}
ORG {'precision': 0.5059523809523809, 'recall': 0.4913294797687861, 'f1': 0.4985337243401759, 'number': 173}
PER {'precision': 0.9517241379310345, 'recall': 0.8173741362290227, 'f1': 0.8794476898566118, 'number': 1013}
PROD {'precision': 0.4214046822742475, 'recall': 0.4064516129032258, 'f1': 0.41379310344827586, 'number': 310}
overall_precision 0.756774193548387
overall_recall 0.7011356843992828
overall_f1 0.7278932671424139
overall_accuracy 0.9640609322265803

Nervaluate tulemused
Strict {'correct': 1173, 'incorrect': 274, 'partial': 0, 'missed': 226, 'spurious': 110, 'possible': 1673, 'actual': 1557, 'precision': 0.7533718689788054, 'recall': 0.701

Seqeval tulemused
EVE {'precision': 0.5842696629213483, 'recall': 0.5473684210526316, 'f1': 0.5652173913043478, 'number': 95}
GEP {'precision': 0.6980108499095841, 'recall': 0.8230277185501066, 'f1': 0.7553816046966731, 'number': 469}
LOC {'precision': 0.811787072243346, 'recall': 0.6832, 'f1': 0.741963509991312, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7746288798920378, 'recall': 0.7852257181942545, 'f1': 0.7798913043478262, 'number': 731}
PER {'precision': 0.9438103599648815, 'recall': 0.9396853146853147, 'f1': 0.941743320192729, 'number': 2288}
PROD {'precision': 0.5961538461538461, 'recall': 0.5387045813586098, 'f1': 0.5659751037344398, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.8258037402815718
overall_recall 0.8101422387136673
overall_f1 0.81789802289282
overall_accuracy 0.9826683846250328

Nervaluate tulemused
Strict {'correct': 3930, 'incorrect': 707, 'partial': 0, 'mis

In [18]:
# Train tartuNLP/EstRoBERTa on the combined (EWT + EDT) dataset for 6 epochs;
# train_model lower-cases the dataset name, so 'Combined' is accepted.
(
    estroberta_combined_6,
    estroberta_combined_6_trainer,
    estroberta_combined_6_results,
) = train_model(
    model_name='tartuNLP/EstRoBERTa',
    dataset_name='Combined',
    epochs=6,
)

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

COMBINED andmestik laetud


Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of XLMRobertaForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstRoBERTa and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-10 15:33:53] Alustan tartuNLP/EstRoBERTa treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0826,0.120142,0.701789,0.693244,0.697491,0.971041,0.424242,0.47191,0.446809,89,0.642718,0.616387,0.629278,537,0.724409,0.659498,0.690432,837,0.0,0.0,0.0,9,0.341143,0.8125,0.480528,448,0.956979,0.872331,0.912697,2295,0.482828,0.285885,0.359128,836,0.0,0.0,0.0,41
2,0.0475,0.118941,0.751037,0.746465,0.748744,0.975792,0.582418,0.595506,0.588889,89,0.623711,0.675978,0.648794,537,0.690888,0.715651,0.703052,837,0.0,0.0,0.0,9,0.608137,0.633929,0.620765,448,0.934205,0.903268,0.918476,2295,0.513772,0.513158,0.513465,836,0.0,0.0,0.0,41
3,0.0315,0.127714,0.763662,0.751964,0.757768,0.97696,0.51145,0.752809,0.609091,89,0.592085,0.724395,0.651591,537,0.712589,0.716846,0.714711,837,0.0,0.0,0.0,9,0.614191,0.618304,0.61624,448,0.936572,0.90719,0.921647,2295,0.583099,0.495215,0.535576,836,0.0,0.0,0.0,41
4,0.018,0.157644,0.760008,0.734485,0.747029,0.976456,0.649351,0.561798,0.60241,89,0.58445,0.811918,0.679657,537,0.767367,0.567503,0.652473,837,0.0,0.0,0.0,9,0.539249,0.705357,0.611219,448,0.942423,0.891503,0.916256,2295,0.584034,0.498804,0.538065,836,0.0,0.0,0.0,41


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0826,0.120142,0.701789,0.693244,0.697491,0.971041,0.424242,0.47191,0.446809,89,0.642718,0.616387,0.629278,537,0.724409,0.659498,0.690432,837,0.0,0.0,0.0,9,0.341143,0.8125,0.480528,448,0.956979,0.872331,0.912697,2295,0.482828,0.285885,0.359128,836,0.0,0.0,0.0,41
2,0.0475,0.118941,0.751037,0.746465,0.748744,0.975792,0.582418,0.595506,0.588889,89,0.623711,0.675978,0.648794,537,0.690888,0.715651,0.703052,837,0.0,0.0,0.0,9,0.608137,0.633929,0.620765,448,0.934205,0.903268,0.918476,2295,0.513772,0.513158,0.513465,836,0.0,0.0,0.0,41
3,0.0315,0.127714,0.763662,0.751964,0.757768,0.97696,0.51145,0.752809,0.609091,89,0.592085,0.724395,0.651591,537,0.712589,0.716846,0.714711,837,0.0,0.0,0.0,9,0.614191,0.618304,0.61624,448,0.936572,0.90719,0.921647,2295,0.583099,0.495215,0.535576,836,0.0,0.0,0.0,41
4,0.018,0.157644,0.760008,0.734485,0.747029,0.976456,0.649351,0.561798,0.60241,89,0.58445,0.811918,0.679657,537,0.767367,0.567503,0.652473,837,0.0,0.0,0.0,9,0.539249,0.705357,0.611219,448,0.942423,0.891503,0.916256,2295,0.584034,0.498804,0.538065,836,0.0,0.0,0.0,41
5,0.0093,0.158108,0.770197,0.758248,0.764176,0.977191,0.675,0.606742,0.639053,89,0.610248,0.731844,0.665538,537,0.739762,0.669056,0.702635,837,0.0,0.0,0.0,9,0.585878,0.685268,0.631687,448,0.932629,0.922876,0.927727,2295,0.595007,0.513158,0.55106,836,0.0,0.0,0.0,41
6,0.0049,0.170453,0.774213,0.753535,0.763734,0.977342,0.628205,0.550562,0.586826,89,0.575101,0.791434,0.666144,537,0.773952,0.617682,0.687043,837,0.0,0.0,0.0,9,0.611111,0.6875,0.647059,448,0.941229,0.921133,0.931072,2295,0.593838,0.507177,0.547097,836,0.0,0.0,0.0,41


[2025-03-10 16:18:05] tartuNLP/EstRoBERTa treenimine lõpetatud
Kokku kulus: 2651.95 sekundit (0.74 tundi)
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.5723270440251572, 'recall': 0.6066666666666667, 'f1': 0.5889967637540454, 'number': 150}
GEP {'precision': 0.6932270916334662, 'recall': 0.6566037735849056, 'f1': 0.6744186046511628, 'number': 530}
LOC {'precision': 0.6082224909310762, 'recall': 0.7321688500727802, 'f1': 0.6644649933949802, 'number': 687}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7001044932079414, 'recall': 0.7411504424778761, 'f1': 0.7200429876410532, 'number': 904}
PER {'precision': 0.9435897435897436, 'recall': 0.891850954256286, 'f1': 0.9169911228780564, 'number': 3301}
PROD {'precision': 0.5714285714285714, 'recall': 0.559915164369035, 'f1': 0.5656132833422604, 'number': 943}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7823945829485995
overall_recall 0.7791570881226053
overall_f1 0.7807724794594179
overall_accuracy 0.9775619099740046

Nervaluate tulemused
Strict {'correct': 5084, 'incorrect': 1104, '

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstRoBERTa EWT testandmestikul
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.84, 'recall': 0.7636363636363637, 'f1': 0.8000000000000002, 'number': 55}
GEP {'precision': 0.875, 'recall': 0.8166666666666667, 'f1': 0.8448275862068966, 'number': 60}
LOC {'precision': 0.3092105263157895, 'recall': 0.7580645161290323, 'f1': 0.4392523364485981, 'number': 62}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
ORG {'precision': 0.5406976744186046, 'recall': 0.5375722543352601, 'f1': 0.5391304347826088, 'number': 173}
PER {'precision': 0.9387308533916849, 'recall': 0.8469891411648569, 'f1': 0.8905033731188376, 'number': 1013}
PROD {'precision': 0.49382716049382713, 'recall': 0.5161290322580645, 'f1': 0.5047318611987381, 'number': 310}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
overall_precision 0.7470095693779905
overall_recall 0.7465630603705917
overall_f1 0.7467862481315397
overall_accuracy 0.9640153242725531

Nervaluate tulemused
Strict {'correct': 1249, 'incorrect': 250, 'partial': 0, 'missed': 174, 

Seqeval tulemused
EVE {'precision': 0.44954128440366975, 'recall': 0.5157894736842106, 'f1': 0.48039215686274517, 'number': 95}
GEP {'precision': 0.6696629213483146, 'recall': 0.6353944562899787, 'f1': 0.652078774617068, 'number': 469}
LOC {'precision': 0.6755555555555556, 'recall': 0.7296, 'f1': 0.7015384615384616, 'number': 625}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 8}
ORG {'precision': 0.7350318471337579, 'recall': 0.7893296853625171, 'f1': 0.7612137203166228, 'number': 731}
PER {'precision': 0.9456029011786038, 'recall': 0.9117132867132867, 'f1': 0.9283489096573209, 'number': 2288}
PROD {'precision': 0.6133333333333333, 'recall': 0.5813586097946287, 'f1': 0.5969180859691808, 'number': 633}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7946113989637306
overall_recall 0.7903525046382189
overall_f1 0.7924762298470442
overall_accuracy 0.9809466254660723

Nervaluate tulemused
Strict {'correct': 3834, 'incorrect': 854, 'partial': 0

In [20]:
# Fine-tune tartuNLP/EstBERT on the combined (EWT + EDT) dataset for 3 epochs.
# The three values returned by train_model are stored under run-specific
# names so that this particular run can be referenced separately from others.
(
    estbert_combined_3,
    estbert_combined_3_trainer,
    estbert_combined_3_results,
) = train_model(
    model_name='tartuNLP/EstBERT',
    dataset_name='Combined',
    epochs=3,
)

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

COMBINED andmestik laetud


tokenizer_config.json:   0%|          | 0.00/62.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/534 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/410k [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]

Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

model.safetensors:   0%|          | 0.00/498M [00:00<?, ?B/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-10 16:20:13] Alustan tartuNLP/EstBERT treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0929,0.136176,0.718673,0.6974,0.707877,0.965647,0.315068,0.338235,0.326241,68,0.606383,0.76,0.674556,450,0.76009,0.525581,0.621448,645,0.0,0.0,0.0,12,0.457241,0.774131,0.57491,518,0.93121,0.868648,0.898841,2322,0.502755,0.399781,0.445394,913,0.0,0.0,0.0,72
2,0.0396,0.149739,0.729088,0.7304,0.729743,0.967968,0.402778,0.426471,0.414286,68,0.604247,0.695556,0.646694,450,0.707155,0.658915,0.682183,645,0.0,0.0,0.0,12,0.507607,0.708494,0.591459,518,0.936941,0.902239,0.919263,2322,0.492433,0.463308,0.477427,913,0.0,0.0,0.0,72
3,0.0198,0.173371,0.743004,0.7222,0.732454,0.968661,0.358209,0.352941,0.355556,68,0.574959,0.775556,0.66036,450,0.765199,0.565891,0.650624,645,0.0,0.0,0.0,12,0.516129,0.741313,0.608558,518,0.945504,0.896641,0.920424,2322,0.535526,0.445783,0.486551,913,0.0,0.0,0.0,72


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-10 16:34:37] tartuNLP/EstBERT treenimine lõpetatud
Kokku kulus: 863.69 sekundit (0.24 tundi)
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5258620689655172, 'recall': 0.4326241134751773, 'f1': 0.47470817120622577, 'number': 141}
GEP {'precision': 0.6134301270417423, 'recall': 0.7699316628701595, 'f1': 0.6828282828282829, 'number': 439}
LOC {'precision': 0.7274633123689728, 'recall': 0.6995967741935484, 'f1': 0.7132579650565263, 'number': 496}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7200811359026369, 'recall': 0.7395833333333334, 'f1': 0.7297019527235354, 'number': 960}
PER {'precision': 0.9414343877231444, 'recall': 0.8784336645236703, 'f1': 0.908843537414966, 'number': 3422}
PROD {'precision': 0.4791431792559188, 'recall': 0.44642857142857145, 'f1': 0.4622077215878195, 'number': 952}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7869565217391304
overall_recall 0.7614521657837332
overall_f1 0.7739942983845423
overall_accuracy 0.9702878823341012

Nervaluate tulemused
Strict {'correct': 4887, 'incorrect': 986,

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstBERT EWT testandmestikul
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.49056603773584906, 'recall': 0.45614035087719296, 'f1': 0.4727272727272727, 'number': 57}
GEP {'precision': 0.3253968253968254, 'recall': 0.7454545454545455, 'f1': 0.4530386740331491, 'number': 55}
LOC {'precision': 0.37037037037037035, 'recall': 0.5454545454545454, 'f1': 0.4411764705882353, 'number': 55}
ORG {'precision': 0.7076923076923077, 'recall': 0.5974025974025974, 'f1': 0.6478873239436619, 'number': 231}
PER {'precision': 0.9563365282215123, 'recall': 0.8200913242009132, 'f1': 0.8829891838741396, 'number': 1095}
PROD {'precision': 0.43359375, 'recall': 0.30662983425414364, 'f1': 0.3592233009708738, 'number': 362}
overall_precision 0.7539393939393939
overall_recall 0.6706199460916442
overall_f1 0.7098430813124108
overall_accuracy 0.9486344417780825

Nervaluate tulemused
Strict {'correct': 1244, 'incorrect': 277, 'partial': 0, 'missed': 334, 'spurious': 149, 'possible': 1855, 'actual': 1670, 'precision': 0.7449101796407186, 'recall': 0.670619

Seqeval tulemused
EVE {'precision': 0.5555555555555556, 'recall': 0.4166666666666667, 'f1': 0.4761904761904762, 'number': 84}
GEP {'precision': 0.6988235294117647, 'recall': 0.7734375, 'f1': 0.7342398022249692, 'number': 384}
LOC {'precision': 0.8005050505050505, 'recall': 0.7188208616780045, 'f1': 0.7574671445639187, 'number': 441}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7231352718078382, 'recall': 0.7846364883401921, 'f1': 0.7526315789473684, 'number': 729}
PER {'precision': 0.935226264418811, 'recall': 0.9058874086807047, 'f1': 0.9203230735647239, 'number': 2327}
PROD {'precision': 0.4976228209191759, 'recall': 0.5322033898305085, 'f1': 0.5143325143325144, 'number': 590}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7989035087719298
overall_recall 0.7983782599167214
overall_f1 0.7986407979831196
overall_accuracy 0.9762387122104437

Nervaluate tulemused
Strict {'correct': 3643, 'incorrect': 709, 'partial': 

In [22]:
# Fine-tune tartuNLP/EstBERT on the combined (EWT + EDT) dataset for 6 epochs.
# The three values returned by train_model are stored under run-specific
# names so that this particular run can be referenced separately from others.
(
    estbert_combined_6,
    estbert_combined_6_trainer,
    estbert_combined_6_results,
) = train_model(
    model_name='tartuNLP/EstBERT',
    dataset_name='Combined',
    epochs=6,
)

Map:   0%|          | 0/5444 [00:00<?, ? examples/s]

Map:   0%|          | 0/833 [00:00<?, ? examples/s]

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/24601 [00:00<?, ? examples/s]

Map:   0%|          | 0/3122 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

COMBINED andmestik laetud


Map:   0%|          | 0/30045 [00:00<?, ? examples/s]

Map:   0%|          | 0/3955 [00:00<?, ? examples/s]

Map:   0%|          | 0/4120 [00:00<?, ? examples/s]

Some weights of BertForTokenClassification were not initialized from the model checkpoint at tartuNLP/EstBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


[2025-03-10 16:36:22] Alustan tartuNLP/EstBERT treenimist


Epoch,Training Loss,Validation Loss,Precision,Recall,F1,Accuracy,Eve precision,Eve recall,Eve f1,Eve number,Gep precision,Gep recall,Gep f1,Gep number,Loc precision,Loc recall,Loc f1,Loc number,Muu precision,Muu recall,Muu f1,Muu number,Org precision,Org recall,Org f1,Org number,Per precision,Per recall,Per f1,Per number,Prod precision,Prod recall,Prod f1,Prod number,Unk precision,Unk recall,Unk f1,Unk number
1,0.0949,0.138038,0.738429,0.6956,0.716375,0.966408,0.433333,0.382353,0.40625,68,0.635161,0.746667,0.686415,450,0.777778,0.575194,0.661319,645,0.0,0.0,0.0,12,0.500654,0.739382,0.597038,518,0.93451,0.866494,0.899218,2322,0.482094,0.383352,0.42709,913,0.0,0.0,0.0,72
2,0.0451,0.161635,0.71942,0.7246,0.722001,0.966434,0.299145,0.514706,0.378378,68,0.632829,0.651111,0.64184,450,0.672673,0.694574,0.683448,645,0.0,0.0,0.0,12,0.502688,0.722008,0.59271,518,0.939671,0.885444,0.911752,2322,0.486014,0.456736,0.47092,913,0.0,0.0,0.0,72
3,0.024,0.190457,0.731474,0.7186,0.72498,0.967154,0.350649,0.397059,0.372414,68,0.573071,0.775556,0.659112,450,0.694136,0.67907,0.68652,645,0.0,0.0,0.0,12,0.534024,0.696911,0.60469,518,0.941066,0.859604,0.898492,2322,0.534854,0.462212,0.495887,913,0.0,0.0,0.0,72
4,0.0119,0.215714,0.742706,0.728,0.735279,0.968048,0.289157,0.352941,0.317881,68,0.587838,0.773333,0.667946,450,0.751434,0.609302,0.672945,645,0.0,0.0,0.0,12,0.589172,0.714286,0.645724,518,0.933274,0.897502,0.915038,2322,0.509069,0.461117,0.483908,913,0.0,0.0,0.0,72
5,0.0071,0.217182,0.746892,0.733,0.739881,0.968715,0.316456,0.367647,0.340136,68,0.6098,0.746667,0.671329,450,0.712095,0.648062,0.678571,645,0.0,0.0,0.0,12,0.557927,0.706564,0.623509,518,0.948378,0.894057,0.920417,2322,0.546125,0.486309,0.514484,913,0.0,0.0,0.0,72
6,0.0031,0.231435,0.749746,0.7388,0.744233,0.968661,0.377049,0.338235,0.356589,68,0.592845,0.773333,0.671167,450,0.751434,0.609302,0.672945,645,0.0,0.0,0.0,12,0.583463,0.722008,0.645384,518,0.94538,0.894488,0.91923,2322,0.532814,0.524644,0.528698,913,0.0,0.0,0.0,72


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


[2025-03-10 17:05:15] tartuNLP/EstBERT treenimine lõpetatud
Kokku kulus: 1732.96 sekundit (0.48 tundi)
Hindan testandmestikul..


Seqeval tulemused
EVE {'precision': 0.5128205128205128, 'recall': 0.425531914893617, 'f1': 0.4651162790697675, 'number': 141}
GEP {'precision': 0.5884476534296029, 'recall': 0.7425968109339408, 'f1': 0.6565961732124874, 'number': 439}
LOC {'precision': 0.7060041407867494, 'recall': 0.6875, 'f1': 0.6966292134831461, 'number': 496}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7071651090342679, 'recall': 0.709375, 'f1': 0.7082683307332295, 'number': 960}
PER {'precision': 0.9376966645689113, 'recall': 0.8708357685563998, 'f1': 0.903030303030303, 'number': 3422}
PROD {'precision': 0.46834170854271356, 'recall': 0.4894957983193277, 'f1': 0.4786851566512583, 'number': 952}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7694990488268865
overall_recall 0.7563103770645061
overall_f1 0.7628477133427628
overall_accuracy 0.9690560366597273

Nervaluate tulemused
Strict {'correct': 4854, 'incorrect': 1038, 'partial': 0, 'missed'

Map:   0%|          | 0/913 [00:00<?, ? examples/s]

Map:   0%|          | 0/3207 [00:00<?, ? examples/s]

Kombineeritud andmestikul treenitud tartuNLP/EstBERT EWT testandmestikul
Hindan testandmestikul..


  _warn_prf(average, modifier, msg_start, len(result))


Seqeval tulemused
EVE {'precision': 0.5423728813559322, 'recall': 0.5614035087719298, 'f1': 0.5517241379310345, 'number': 57}
GEP {'precision': 0.3333333333333333, 'recall': 0.7636363636363637, 'f1': 0.46408839779005523, 'number': 55}
LOC {'precision': 0.37333333333333335, 'recall': 0.509090909090909, 'f1': 0.4307692307692308, 'number': 55}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
ORG {'precision': 0.6703910614525139, 'recall': 0.5194805194805194, 'f1': 0.5853658536585366, 'number': 231}
PER {'precision': 0.9374337221633086, 'recall': 0.8073059360730593, 'f1': 0.8675171736997056, 'number': 1095}
PROD {'precision': 0.409375, 'recall': 0.36187845303867405, 'f1': 0.38416422287390023, 'number': 362}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 0}
overall_precision 0.7221249270286048
overall_recall 0.6668463611859838
overall_f1 0.6933856502242153
overall_accuracy 0.9462347160324535

Nervaluate tulemused
Strict {'correct': 1237, 'incorrect': 303, 'partial':

Seqeval tulemused
EVE {'precision': 0.4827586206896552, 'recall': 0.3333333333333333, 'f1': 0.39436619718309857, 'number': 84}
GEP {'precision': 0.6635514018691588, 'recall': 0.7395833333333334, 'f1': 0.6995073891625615, 'number': 384}
LOC {'precision': 0.7671568627450981, 'recall': 0.7097505668934241, 'f1': 0.7373380447585395, 'number': 441}
MUU {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 6}
ORG {'precision': 0.7155612244897959, 'recall': 0.7695473251028807, 'f1': 0.7415730337078652, 'number': 729}
PER {'precision': 0.9378076062639821, 'recall': 0.9007305543618392, 'f1': 0.9188952213941254, 'number': 2327}
PROD {'precision': 0.4962962962962963, 'recall': 0.5677966101694916, 'f1': 0.5296442687747036, 'number': 590}
UNK {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 2}
overall_precision 0.7871599564744287
overall_recall 0.7926802542187158
overall_f1 0.7899104607993012
overall_accuracy 0.9753278366705929

Nervaluate tulemused
Strict {'correct': 3617, 'incorrect': 735, 