In [1]:
import pandas as pd
import numpy as np

from tqdm import tqdm
tqdm.pandas(desc="progress-bar")
from gensim.models import Doc2Vec

import gensim
from sklearn.linear_model import LogisticRegression
from gensim.models.doc2vec import TaggedDocument

from sklearn.model_selection import KFold

from sklearn.base import clone as sklearn_clone

from datasets import Dataset, DatasetDict
import pandas as pd
import torch

from transformers import AutoTokenizer

from adapters import AutoAdapterModel
from transformers import AutoTokenizer

from adapters import BertAdapterModel

from transformers import  BertConfig

from adapters import SeqBnConfig #PfeifferConfig

from transformers import TrainingArguments, EvalPrediction
from adapters import AdapterTrainer
from sklearn.metrics import accuracy_score, f1_score, mean_absolute_error

torch.cuda.is_available()

True

In [2]:
# !conda install -c conda-forge huggingface_hub
# !pip install --force-reinstall charset-normalizer==3.1.0
# !pip install accelerate -U

## Lodad data

In [3]:
with open('../datasets/used_data/03_bert_like_models/02_topics.npy', 'rb') as f:
    df_topics = pd.DataFrame(np.load(f), columns=['topic'])
df_topics.shape

(6529, 1)

In [4]:
df = pd.read_parquet('../datasets/used_data/03_bert_like_models/01_basic_info_data.parquet')

df['sentence'] = df['text'].apply(lambda x: x.replace('\n',' ').strip())
df['labels'] = df['assestment'].astype(int)

df = df.sample(frac=1, random_state=111)

df = df[df.index.isin(df_topics.index)]
df.shape

(6529, 5)

In [5]:
tok = AutoTokenizer.from_pretrained('allegro/herbert-large-cased')

In [6]:
labels = sorted(set(df['labels']))
num_labels = len(labels)
label2id = dict(zip(labels,range(num_labels)))
id2label = {v: k for k, v in label2id.items()}

def encode_batch(batch):
    """Encodes a batch of input data using the model tokenizer."""
    batch['labels'] = np.array(batch['labels'])
    return tok(text=batch['sentence'], max_length=64, truncation=True, padding="max_length")

### Kfold

In [7]:
cv_fold = []
cv_fold_i = []

for i in df_topics['topic'].unique().reshape(10,-1):
    train_cv = df_topics.index[ ~np.isin(df_topics["topic"], i) ].values
    test_cv = df_topics.index[ np.isin(df_topics["topic"], i) ].values
    
    cv_fold.append( [train_cv, test_cv])

In [8]:
kf = KFold(n_splits=10, shuffle=True)
kf.get_n_splits(df_topics)

cv_Kfold = []
cv_Kfold_i = []

for train_index, test_index in kf.split(df_topics):
    train_cv = df_topics.iloc[ train_index, : ].index.values
    test_cv = df_topics.iloc[ test_index, : ].index.values
    
    cv_Kfold.append( [train_cv, test_cv])

## Experiments

In [9]:
config = BertConfig.from_pretrained(
    'allegro/herbert-large-cased',
    num_labels=num_labels
)

adapter_config = SeqBnConfig() #PfeifferConfig()


training_args = TrainingArguments(
    remove_unused_columns=False, # ensure the dataset labels are properly passed to the model
    
    fp16=True,
    learning_rate=1e-4,
    num_train_epochs=10,
    per_device_train_batch_size=8,
    per_device_eval_batch_size=32,
    gradient_accumulation_steps=1,
    max_grad_norm=1.0,
    label_smoothing_factor=0.0,
    weight_decay=0.05,
    warmup_steps=600,
    output_dir="./training_output",
    overwrite_output_dir=True,
    
#     logging_strategy="no"
    
#     logging_steps=200,
#     logging_first_step=False,
#     logging_dir='./tb_logs',
#     evaluation_strategy='steps',
#     report_to='tensorboard',
#     save_steps=200
)

def compute_accuracy_f1score(p: EvalPrediction):
    preds = [id2label[pred_id] for pred_id in np.argmax(p.predictions, axis=1)]
    target_labels = [id2label[label_id] for label_id in p.label_ids]
    return {"accuracy": accuracy_score(target_labels,preds),
           "f1score": f1_score(target_labels,preds)}

In [10]:
cv = cv_fold

In [11]:
acc = []
f1 = []

j = 1

for train_cv, test_cv in cv:
    ds = DatasetDict()
    ds['train'] = Dataset.from_pandas(df[df.index.isin(train_cv)])
    ds['valid'] = Dataset.from_pandas(df[df.index.isin(test_cv)])
    
    
    ds = ds.map(encode_batch, batched=True, batch_size=len(ds['train']))
    ds.set_format(type="torch", columns=["input_ids", "attention_mask", "labels"])
    
    
    model = BertAdapterModel.from_pretrained('allegro/herbert-large-cased', config=config).to('cuda')
    
    adapter_name='fake_news_'+str(j)
    
    model.add_adapter(adapter_name,config=adapter_config)
    model.add_classification_head(
        adapter_name,
        id2label=id2label,
        num_labels=num_labels
      )

    model.train_adapter(adapter_name)
    
    
    trainer = AdapterTrainer(
        model=model,
        args=training_args,
        train_dataset=ds["train"],
        eval_dataset=ds["valid"],
        compute_metrics=compute_accuracy_f1score,
    )

    trainer.train()
    
    eval_out = trainer.evaluate()
    
    acc.append(eval_out['eval_accuracy'])
    f1.append(eval_out['eval_f1score'])
    
    j+=1

Map:   0%|          | 0/5906 [00:00<?, ? examples/s]

Map:   0%|          | 0/623 [00:00<?, ? examples/s]

Step,Training Loss
500,0.5799
1000,0.535
1500,0.5136
2000,0.5053
2500,0.479
3000,0.4759
3500,0.4497
4000,0.4375
4500,0.4189
5000,0.3892


Map:   0%|          | 0/5877 [00:00<?, ? examples/s]

Map:   0%|          | 0/652 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_1.1.weight', 'heads.fake_news_1.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_1.1.bias']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Step,Training Loss
500,0.5758
1000,0.516
1500,0.5219
2000,0.4993
2500,0.4743
3000,0.476
3500,0.4518
4000,0.4005
4500,0.4075
5000,0.3645


Map:   0%|          | 0/5906 [00:00<?, ? examples/s]

Map:   0%|          | 0/623 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_2.1.weight', 'heads.fake_news_2.1.bias', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_2.4.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Step,Training Loss
500,0.5863
1000,0.54
1500,0.5207
2000,0.5055
2500,0.4972
3000,0.4783
3500,0.449
4000,0.4303
4500,0.4213
5000,0.3887


Map:   0%|          | 0/5624 [00:00<?, ? examples/s]

Map:   0%|          | 0/905 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_2.1.weight', 'heads.fake_news_3.1.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.4.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_3.4.bias', 'heads.fake_news_3.1.weight', 'heads.fake_news_2.4.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Step,Training Loss
500,0.5897
1000,0.5363
1500,0.4997
2000,0.495
2500,0.4895
3000,0.4685
3500,0.4398
4000,0.4068
4500,0.3947
5000,0.3644


Map:   0%|          | 0/5897 [00:00<?, ? examples/s]

Map:   0%|          | 0/632 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_2.1.weight', 'heads.fake_news_4.1.bias', 'heads.fake_news_3.1.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_1.1.weight', 'heads.fake_news_4.1.weight', 'heads.fake_news_1.4.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_3.4.bias', 'heads.fake_news_3.1.weight', 'heads.fake_news_2.4.weight', 'heads.fake_news_4.4.bias']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Step,Training Loss
500,0.5763
1000,0.5339
1500,0.5321
2000,0.4995
2500,0.5002
3000,0.4669
3500,0.4587
4000,0.428
4500,0.4112
5000,0.3816


Map:   0%|          | 0/5897 [00:00<?, ? examples/s]

Map:   0%|          | 0/632 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_5.1.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_2.1.weight', 'heads.fake_news_4.1.bias', 'heads.fake_news_3.1.bias', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_5.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news_1.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_3.4.bias', 'heads.fake_news_3.1.weight', 'heads.fake_news_2.4.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Step,Training Loss
500,0.5706
1000,0.5301
1500,0.5098
2000,0.4962
2500,0.4816
3000,0.4955
3500,0.4571
4000,0.409
4500,0.4255
5000,0.3779


Map:   0%|          | 0/5981 [00:00<?, ? examples/s]

Map:   0%|          | 0/548 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_5.1.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_2.1.weight', 'heads.fake_news_4.1.bias', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_5.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news_6.4.bias', 'heads.fake_news_6.1.bias', 'heads.fake_news_1.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_6.4.weight', 'heads.fake_news_3.4.bias', 'heads.fake_news_3.1.weight', 'heads.fake_news_2.4.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Step,Training Loss
500,0.5779
1000,0.5339
1500,0.5448
2000,0.5079
2500,0.4918
3000,0.4838
3500,0.4612
4000,0.4346
4500,0.4121
5000,0.3769


Map:   0%|          | 0/5873 [00:00<?, ? examples/s]

Map:   0%|          | 0/656 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_7.4.weight', 'heads.fake_news_7.4.bias', 'heads.fake_news_2.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_4.1.bias', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_5.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news_6.4.bias', 'heads.fake_news_6.1.bias', 'heads.fake_news_1.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_6.4.weight', 'heads.fake_news_3.4.bias', 'heads.fake_news_3.1.weight', 'heads.fake_news_2.4.weight']
You should probably TRAIN this model on a down-st

Step,Training Loss
500,0.576
1000,0.5415
1500,0.538
2000,0.5098
2500,0.4915
3000,0.4764
3500,0.4598
4000,0.4222
4500,0.4092
5000,0.3852


Map:   0%|          | 0/5861 [00:00<?, ? examples/s]

Map:   0%|          | 0/668 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_7.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_7.4.bias', 'heads.fake_news_2.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_4.1.bias', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_8.4.weight', 'heads.fake_news_5.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news_6.4.bias', 'heads.fake_news_6.1.bias', 'heads.fake_news_1.4.weight', 'heads.fake_news_1.4.bias', 'heads.fake_news_2.4.bias', 'heads.fake_news_6.4.weight', 'heads.fake_news_3.4.

Step,Training Loss
500,0.5652
1000,0.5378
1500,0.5087
2000,0.528
2500,0.4813
3000,0.4738
3500,0.4479
4000,0.4384
4500,0.4139
5000,0.3956


Map:   0%|          | 0/5939 [00:00<?, ? examples/s]

Map:   0%|          | 0/590 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_9.4.bias', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_7.4.bias', 'heads.fake_news_2.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_9.1.bias', 'heads.fake_news_4.1.bias', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_8.4.weight', 'heads.fake_news_5.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news_6.4.bias', 'heads.fake_news_6.1.bias', 'heads.fake_news_9.1.weight', 'heads.fake_news_1.4.

Step,Training Loss
500,0.5777
1000,0.5461
1500,0.5161
2000,0.5104
2500,0.4943
3000,0.4812
3500,0.451
4000,0.4368
4500,0.4253
5000,0.3896


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-2000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_model_head.bin
Configurati

Configuration saved in ./training_output/checkpoint-3500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-4000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-5000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-5500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-7000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configurati

In [12]:
acc = np.array(acc)
f1 = np.array(f1)

print(
    'adapters',
    f'Accuracy {acc.mean():.3f}+-{acc.std():.3f}',
    f'F1 Score {f1.mean():.3f}+-{f1.std():.3f}',
    f' {acc.mean():.3f}+-{acc.std():.3f} | {f1.mean():.3f}+-{f1.std():.3f}'
)

adapters Accuracy 0.761+-0.029 F1 Score 0.754+-0.063  0.761+-0.029 | 0.754+-0.063


In [13]:
cv = cv_Kfold

In [14]:
acc = []
f1 = []

for train_cv, test_cv in cv:
    ds = DatasetDict()
    ds['train'] = Dataset.from_pandas(df[df.index.isin(train_cv)])
    ds['valid'] = Dataset.from_pandas(df[df.index.isin(test_cv)])
    
    
    ds = ds.map(encode_batch, batched=True, batch_size=len(ds['train']))
    ds.set_format(type="torch", columns=["input_ids", "attention_mask", "labels"])
    
    
    model = BertAdapterModel.from_pretrained('allegro/herbert-large-cased', config=config).to('cuda')

    adapter_name='fake_news_'+str(j)
    
    model.add_adapter(adapter_name,config=adapter_config)
    model.add_classification_head(
        adapter_name,
        id2label=id2label,
        num_labels=num_labels
      )

    model.train_adapter(adapter_name)
    
    
    trainer = AdapterTrainer(
        model=model,
        args=training_args,
        train_dataset=ds["train"],
        eval_dataset=ds["valid"],
        compute_metrics=compute_accuracy_f1score,
    )

    trainer.train()
    
    eval_out = trainer.evaluate()
    
    acc.append(eval_out['eval_accuracy'])
    f1.append(eval_out['eval_f1score'])
    
    j += 1

Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_9.4.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake_news_7.4.bias', 'heads.fake_news_2.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_9.1.bias', 'heads.fake_news_4.1.bias', 'heads.fake_news_10.1.weight', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_news_8.4.weight', 'heads.fake_news_5.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news

Step,Training Loss
500,0.5768
1000,0.5283
1500,0.5175
2000,0.4973
2500,0.5025
3000,0.4695
3500,0.4444
4000,0.4295
4500,0.4156
5000,0.3705


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_9.4.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_11.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake_news_7.4.bias', 'heads.fake_news_2.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_9.1.bias', 'heads.fake_news_4.1.bias', 'heads.fake_news_11.1.weight', 'heads.fake_news_10.1.weight', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_news_3.4.weight', 'heads.fake_news_5.4.bias', 'heads.fake_news_4.4.weight', 'heads.fake_n

Step,Training Loss
500,0.5725
1000,0.5508
1500,0.5191
2000,0.5046
2500,0.4914
3000,0.4907
3500,0.461
4000,0.4283
4500,0.4278
5000,0.386


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_9.4.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake_news_7.4.bias', 'heads.fake_news_2.1.weight', 'heads.fake_news_12.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_9.1.bias', 'heads.fake_news_4.1.bias', 'heads.fake_news_11.1.weight', 'heads.fake_news_10.1.weight', 'heads.fake_news_3.1.bias', 'heads.fake_news_6.1.weight', 'heads.fake_

Step,Training Loss
500,0.578
1000,0.5187
1500,0.5255
2000,0.494
2500,0.4966
3000,0.4841
3500,0.4494
4000,0.4275
4500,0.4044
5000,0.3824


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_13.4.bias', 'heads.fake_news_9.4.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_13.1.bias', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake_news_7.4.bias', 'heads.fake_news_13.4.weight', 'heads.fake_news_2.1.weight', 'heads.fake_news_12.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_9.1.bias', 'heads.fake_news_4.1.bias', 'heads.fake_news_11.1.weight', 'heads.fake_

Step,Training Loss
500,0.5647
1000,0.5314
1500,0.5151
2000,0.5041
2500,0.4675
3000,0.4659
3500,0.4501
4000,0.4126
4500,0.3874
5000,0.3618


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_5.1.weight', 'heads.fake_news_13.4.bias', 'heads.fake_news_9.4.bias', 'heads.fake_news_14.1.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_14.4.weight', 'heads.fake_news_13.1.bias', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_14.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake_news_7.4.bias', 'heads.fake_news_13.4.weight', 'heads.fake_news_2.1.weight', 'heads.fake_news_12.1.weight', 'heads.fake_news_7.1.weight', 'heads.fak

Step,Training Loss
500,0.5749
1000,0.5379
1500,0.5203
2000,0.4932
2500,0.4778
3000,0.4747
3500,0.4439
4000,0.4351
4500,0.4072
5000,0.3667


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_15.1.weight', 'heads.fake_news_5.1.weight', 'heads.fake_news_13.4.bias', 'heads.fake_news_9.4.bias', 'heads.fake_news_14.1.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_14.4.weight', 'heads.fake_news_13.1.bias', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_14.4.bias', 'heads.fake_news_15.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake_news_7.4.bias', 'heads.fake_news_13.4.weight', 'heads.fake_news_2.1.weight', 'heads.fake

Step,Training Loss
500,0.5882
1000,0.5332
1500,0.5144
2000,0.5072
2500,0.4708
3000,0.4743
3500,0.4529
4000,0.4172
4500,0.4076
5000,0.3645


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_15.1.weight', 'heads.fake_news_5.1.weight', 'heads.fake_news_13.4.bias', 'heads.fake_news_9.4.bias', 'heads.fake_news_14.1.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_14.4.weight', 'heads.fake_news_13.1.bias', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_16.4.bias', 'heads.fake_news_16.1.bias', 'heads.fake_news_14.4.bias', 'heads.fake_news_16.4.weight', 'heads.fake_news_15.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_10.4.bias', 'heads.fake

Step,Training Loss
500,0.5777
1000,0.5383
1500,0.5352
2000,0.4995
2500,0.4925
3000,0.4859
3500,0.4517
4000,0.4406
4500,0.4257
5000,0.4033


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_15.1.weight', 'heads.fake_news_5.1.weight', 'heads.fake_news_13.4.bias', 'heads.fake_news_9.4.bias', 'heads.fake_news_14.1.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_14.4.weight', 'heads.fake_news_13.1.bias', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_16.4.bias', 'heads.fake_news_16.1.bias', 'heads.fake_news_14.4.bias', 'heads.fake_news_16.4.weight', 'heads.fake_news_15.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_17.1.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_3.4.bias', 'heads.fake_news_17.4.bias', 'heads.fake_news_7.4.weight', 'heads.fake_ne

Step,Training Loss
500,0.5715
1000,0.5339
1500,0.5237
2000,0.5107
2500,0.491
3000,0.4782
3500,0.4514
4000,0.4376
4500,0.4328
5000,0.3863


Map:   0%|          | 0/5876 [00:00<?, ? examples/s]

Map:   0%|          | 0/653 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_7.1.bias', 'heads.fake_news_15.1.weight', 'heads.fake_news_5.1.weight', 'heads.fake_news_13.4.bias', 'heads.fake_news_9.4.bias', 'heads.fake_news_14.1.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_1.1.weight', 'heads.fake_news_14.4.weight', 'heads.fake_news_13.1.bias', 'heads.fake_news_12.1.bias', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_4.4.bias', 'heads.fake_news_16.4.bias', 'heads.fake_news_16.1.bias', 'heads.fake_news_18.4.bias', 'heads.fake_news_18.1.bias', 'heads.fake_news_16.4.weight', 'heads.fake_news_14.4.bias', 'heads.fake_news_15.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_17.1.bias', 'heads.fake_news_4.1.weight', 'heads.fake_news_11.4.weight', 'heads.fake_news_12.4.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_3.4.bias', 'heads.fake_new

Step,Training Loss
500,0.5604
1000,0.5383
1500,0.5306
2000,0.5157
2500,0.4659
3000,0.473
3500,0.4467
4000,0.4341
4500,0.4062
5000,0.3829


Map:   0%|          | 0/5877 [00:00<?, ? examples/s]

Map:   0%|          | 0/652 [00:00<?, ? examples/s]

Some weights of BertAdapterModel were not initialized from the model checkpoint at allegro/herbert-large-cased and are newly initialized: ['heads.fake_news_13.4.bias', 'heads.fake_news_1.1.weight', 'heads.fake_news_1.1.bias', 'heads.fake_news_8.1.bias', 'heads.fake_news_18.1.bias', 'heads.fake_news_16.4.weight', 'heads.fake_news_15.4.bias', 'heads.fake_news_2.1.bias', 'heads.fake_news_8.4.bias', 'heads.fake_news_17.1.bias', 'heads.fake_news_11.4.bias', 'heads.fake_news_10.4.bias', 'heads.fake_news_17.1.weight', 'heads.fake_news_2.1.weight', 'heads.fake_news_12.4.weight', 'heads.fake_news_5.1.bias', 'heads.fake_news_10.1.bias', 'heads.fake_news_9.1.weight', 'heads.fake_news_3.1.weight', 'heads.fake_news_7.1.bias', 'heads.fake_news_15.1.weight', 'heads.fake_news_9.4.bias', 'heads.fake_news_10.4.weight', 'heads.fake_news_19.1.bias', 'heads.fake_news_9.4.weight', 'heads.fake_news_8.1.weight', 'heads.fake_news_7.1.weight', 'heads.fake_news_15.4.weight', 'heads.fake_news_11.1.weight', 'heads

Step,Training Loss
500,0.5788
1000,0.5239
1500,0.5234
2000,0.511
2500,0.4788
3000,0.4749
3500,0.4533
4000,0.4319
4500,0.4271
5000,0.3953


Configuration saved in ./training_output/checkpoint-1500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_18/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-2500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_5/pytorch_adapter.bin
Configuratio

Module weights saved in ./training_output/checkpoint-3000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_18/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-3500
Configuration saved in ./training_output/checkpoint-3500/fake_news_1/adapter_config.json
Module weights saved in ./traini

Configuration saved in ./training_output/checkpoint-3500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_11/head_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-4000/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_15/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_11/pytorch_adapter.bin
Config

Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_7/adapter_config.json
Module weights s

Configuration saved in ./training_output/checkpoint-5500/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_18/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-6000
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/c

Module weights saved in ./training_output/checkpoint-6000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_model_head.bin
Co

Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-7000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_17/pytorch_adapter.bin
C

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_19'.
Adding head 'fake_news_19' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6641
1000,0.6076
1500,0.5706
2000,0.5383
2500,0.4923
3000,0.4977
3500,0.4592
4000,0.42
4500,0.4043
5000,0.3729


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_14/head_config.json
Module weights saved 

Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-1500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_15/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_9/pytorch_adapter.bin
Configuratio

Saving model checkpoint to ./training_output/checkpoint-2500
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_13/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-3000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weig

Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_14/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-4000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_9/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-4000/fake_news_19/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-4500
Configuration saved in ./training_output/checkpoint-4500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/adapter_config.json
Module weights saved in ./training_outpu

Configuration saved in ./training_output/checkpoint-4500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/head_config.json
Module weigh

Module weights saved in ./training_output/checkpoint-5000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_model_head.bin
Con

Configuration saved in ./training_output/checkpoint-5500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_14/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-6000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_19/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-6500
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/c

Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_12/pytorch_model_head.bin
Config

Configuration saved in ./training_output/checkpoint-7000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module we

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_20'.
Adding head 'fake_news_20' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6679
1000,0.6017
1500,0.5761
2000,0.5336
2500,0.51
3000,0.4916
3500,0.4637
4000,0.4294
4500,0.4174
5000,0.3959


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_12/head_config.json
Module weights saved in .

Module weights saved in ./training_output/checkpoint-1000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_19/pytorch_adapter.bin
C

Configuration saved in ./training_output/checkpoint-1500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_12/adapter_config.json
Module 

Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_model_head.bin
Configuration s

Module weights saved in ./training_output/checkpoint-2000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_14/pytorch_model_head.bin
Co

Configuration saved in ./training_output/checkpoint-2500/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_20/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_20/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_20/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_13/pytorch_adapter.bin
C

Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_6/adapter_config.json
Module weights s

Configuration saved in ./training_output/checkpoint-3500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_17/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-4000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_20/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_20/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_20/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_20/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-5000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_19/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5500/fake_news_20/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_20/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_20/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_15/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_20/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_20/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-7000
Configuration saved in ./training_

Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_model_head.bin
Configuratio

In [15]:
acc = np.array(acc)
f1 = np.array(f1)

print(
    'adapters',
    f'Accuracy {acc.mean():.3f}+-{acc.std():.3f}',
    f'F1 Score {f1.mean():.3f}+-{f1.std():.3f}',
    f' {acc.mean():.3f}+-{acc.std():.3f} | {f1.mean():.3f}+-{f1.std():.3f}'
)

adapters Accuracy 0.765+-0.015 F1 Score 0.766+-0.018  0.765+-0.015 | 0.766+-0.018
