In [1]:
import pandas as pd
import numpy as np

from tqdm import tqdm
tqdm.pandas(desc="progress-bar")
from gensim.models import Doc2Vec

import gensim
from sklearn.linear_model import LogisticRegression
from gensim.models.doc2vec import TaggedDocument

from sklearn.model_selection import KFold

from sklearn.base import clone as sklearn_clone

from datasets import Dataset, DatasetDict
import pandas as pd
import torch

from transformers import AutoTokenizer

from transformers import BertAdapterModel, BertConfig

from transformers import PfeifferConfig

from transformers import TrainingArguments, AdapterTrainer, EvalPrediction
from sklearn.metrics import accuracy_score, f1_score, mean_absolute_error

torch.cuda.is_available()

True

In [2]:
# https://stackoverflow.com/questions/58497442/best-training-methods-for-binary-text-classification-using-doc2vec-gensim

## Lodad data

In [3]:
df_topics = pd.read_csv('../datasets/ready2use/topics.csv', index_col=0)
df_topics.shape

(6541, 1)

In [4]:
df = pd.read_csv('../datasets/ready2use/text_celan_pl_dataset.csv',
                 index_col=0,
                 sep=';',header=None,names='sentence labels'.split())

df['sentence'] = df['sentence'].apply(lambda x: x.replace('\n',' ').strip())
df['labels'] = df['labels'].astype(int)

df = df.sample(frac=1, random_state=111)

df = df[df.index.isin(df_topics.index)]
df.shape

(6541, 2)

In [5]:
tok = AutoTokenizer.from_pretrained('allegro/herbert-large-cased')

In [6]:
labels = sorted(set(df['labels']))
num_labels = len(labels)
label2id = dict(zip(labels,range(num_labels)))
id2label = {v: k for k, v in label2id.items()}

def encode_batch(batch):
    """Encodes a batch of input data using the model tokenizer."""
    batch['labels'] = np.array(batch['labels'])
    return tok(text=batch['sentence'], max_length=64, truncation=True, padding="max_length")

### Kfold

In [7]:
cv_fold = []
cv_fold_i = []

for i in df_topics['topic'].unique().reshape(10,-1):
    train_cv = df_topics.index[ ~np.isin(df_topics["topic"], i) ].values
    test_cv = df_topics.index[ np.isin(df_topics["topic"], i) ].values
    
    train_cv_i = df_topics.reset_index().index[ ~np.isin(df_topics["topic"], i) ].values
    test_cv_i = df_topics.reset_index().index[ np.isin(df_topics["topic"], i) ].values
    
    cv_fold.append( [train_cv, test_cv])
    cv_fold_i.append( [train_cv_i, test_cv_i])

In [8]:
kf = KFold(n_splits=10, shuffle=True)
kf.get_n_splits(df_topics)

cv_Kfold = []
cv_Kfold_i = []

for train_index, test_index in kf.split(df_topics):
    train_cv = df_topics.iloc[ train_index, : ].index.values
    test_cv = df_topics.iloc[ test_index, : ].index.values

    train_cv_i= df_topics.reset_index().iloc[ train_index, : ].index.values
    test_cv_i = df_topics.reset_index().iloc[ test_index, : ].index.values
    
    cv_Kfold.append( [train_cv, test_cv])
    cv_Kfold_i.append( [train_cv_i, test_cv_i])

## Experiments

In [9]:
config = BertConfig.from_pretrained(
    'allegro/herbert-large-cased',
    num_labels=num_labels
)

adapter_config = PfeifferConfig()


training_args = TrainingArguments(
    remove_unused_columns=False, # ensure the dataset labels are properly passed to the model
    
    fp16=True,
    learning_rate=1e-4,
    num_train_epochs=10,
    per_device_train_batch_size=8,
    per_device_eval_batch_size=32,
    gradient_accumulation_steps=1,
    max_grad_norm=1.0,
    label_smoothing_factor=0.0,
    weight_decay=0.05,
    warmup_steps=600,
    output_dir="./training_output",
    overwrite_output_dir=True,
    
#     logging_strategy="no"
    
#     logging_steps=200,
#     logging_first_step=False,
#     logging_dir='./tb_logs',
#     evaluation_strategy='steps',
#     report_to='tensorboard',
#     save_steps=200
)

def compute_accuracy_f1score(p: EvalPrediction):
    preds = [id2label[pred_id] for pred_id in np.argmax(p.predictions, axis=1)]
    target_labels = [id2label[label_id] for label_id in p.label_ids]
    return {"accuracy": accuracy_score(target_labels,preds),
           "f1score": f1_score(target_labels,preds)}

In [10]:
cv = cv_fold

In [11]:
acc = []
f1 = []

j = 1

for train_cv, test_cv in cv:
    ds = DatasetDict()
    ds['train'] = Dataset.from_pandas(df[df.index.isin(train_cv)])
    ds['valid'] = Dataset.from_pandas(df[df.index.isin(test_cv)])
    
    
    ds = ds.map(encode_batch, batched=True, batch_size=len(ds['train']))
    ds.set_format(type="torch", columns=["input_ids", "attention_mask", "labels"])
    
    
    model = BertAdapterModel.from_pretrained('allegro/herbert-large-cased', config=config).to('cuda')
    
    adapter_name='fake_news_'+str(j)
    
    model.add_adapter(adapter_name,config=adapter_config)
    model.add_classification_head(
        adapter_name,
        id2label=id2label,
        num_labels=num_labels
      )

    model.train_adapter(adapter_name)
    
    
    trainer = AdapterTrainer(
        model=model,
        args=training_args,
        train_dataset=ds["train"],
        eval_dataset=ds["valid"],
        compute_metrics=compute_accuracy_f1score,
    )

    trainer.train()
    
    eval_out = trainer.evaluate()
    
    acc.append(eval_out['eval_accuracy'])
    f1.append(eval_out['eval_f1score'])
    
    j+=1

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

Some weights of the model checkpoint at allegro/herbert-large-cased were not used when initializing BertAdapterModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.sso.sso_relationship.weight', 'cls.sso.sso_relationship.bias', 'cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertAdapterModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertAdapterModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 

Step,Training Loss
500,0.6667
1000,0.6057
1500,0.5625
2000,0.536
2500,0.5195
3000,0.4958
3500,0.464
4000,0.4385
4500,0.4101
5000,0.3753


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-1000
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model

Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin


Training completed. Do not forget to share your model on huggingface.co/models =)


***** Running Evaluation *****
  Num examples = 595
  Batch size = 32


  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Some weights of the model checkpoint at allegro/herbert-large-cased were not used when initializing BertAdapterModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.sso.sso_relationship.weight', 'cls.sso.sso_relationship.bias', 'cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertAdapterModel from th

Adding adapter 'fake_news_2'.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5746
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7190


Step,Training Loss
500,0.6754
1000,0.5777
1500,0.5638
2000,0.5233
2500,0.4969
3000,0.4773
3500,0.4441
4000,0.4044
4500,0.3817
5000,0.3738


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-4500
Configuration saved in ./training_output/checkpoint-4500/fake_news_1/adapter_config.json
Module weights saved in ./training_output

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Some weights of the model checkpoint at allegro/herbert-large-cased were not used when initializing BertAdapterModel: ['cls.predictions.decoder.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.sso.sso_relationship.weight', 'cls.sso.sso_relationship.bias', 'cls.predictio

Adding adapter 'fake_news_3'.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5772
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7220


Step,Training Loss
500,0.6708
1000,0.608
1500,0.5796
2000,0.5409
2500,0.5165
3000,0.4979
3500,0.4619
4000,0.4253
4500,0.3905
5000,0.377


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-3000
Configuration saved in ./training_output/checkpoint-3000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output

Configuration saved in ./training_output/checkpoint-5000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-5500
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/che

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Some weights of the model checkpoint at allegro/herbert-large-cased were not used when initializing BertAdapterModel: ['cls.predic

Adding adapter 'fake_news_4'.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5965
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7460


Step,Training Loss
500,0.6703
1000,0.6114
1500,0.5775
2000,0.5302
2500,0.4998
3000,0.4992
3500,0.4547
4000,0.4428
4500,0.4147
5000,0.3645


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-2500
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_4/head_config.json
Module weights save

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_5'.
Adding head 'fake_news_5' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5924
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7410


Step,Training Loss
500,0.6741
1000,0.5967
1500,0.5769
2000,0.5428
2500,0.5115
3000,0.4873
3500,0.4534
4000,0.4339
4500,0.4093
5000,0.3752


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Saving model checkpoint to ./training_output/checkpoint-2000
Configuration saved in ./training_output/checkpoint-2000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Saving model checkpoint to ./training_output/checkpoint-3500
Configuration saved in ./training_output/checkpoint-3500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Saving model checkpoint to ./training_output/checkpoint-5000
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Saving model checkpoint to ./training_output/checkpoint-6500
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_6'.
Adding head 'fake_news_6' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5898
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7380


Step,Training Loss
500,0.6861
1000,0.6014
1500,0.5645
2000,0.5371
2500,0.509
3000,0.487
3500,0.4487
4000,0.4297
4500,0.4066
5000,0.3715


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-1500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_3/head_config.json
Module weights save

Configuration saved in ./training_output/checkpoint-3000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-4000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configuratio

Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-6500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights save

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_7'.
Adding head 'fake_news_7' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5939
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7430


Step,Training Loss
500,0.6878
1000,0.5902
1500,0.5823
2000,0.5384
2500,0.5048
3000,0.4977
3500,0.4632
4000,0.4377
4500,0.4172
5000,0.3847


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-1500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_5/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-2500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_6/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-3500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_2/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-4500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_7/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-6000
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-7000
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_3/adapter_config.json
Module weights saved in ./training_output

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_8'.
Adding head 'fake_news_8' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5978
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7480


Step,Training Loss
500,0.681
1000,0.6032
1500,0.5955
2000,0.5411
2500,0.5369
3000,0.4988
3500,0.4848
4000,0.4474
4500,0.4414
5000,0.3919


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-1500
Configuration saved in ./training_output/checkpoint-1500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_2/adapter_config.json
Module weights saved in ./training_output

Configuration saved in ./training_output/checkpoint-2000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-2500
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_6/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-4000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_4/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-5000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_model_head.bin
Configuration s

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_9'.
Adding head 'fake_news_9' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5865
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7340


Step,Training Loss
500,0.6743
1000,0.5923
1500,0.5758
2000,0.5299
2500,0.5163
3000,0.4941
3500,0.4726
4000,0.4125
4500,0.4174
5000,0.3747


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-2000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-4500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_9/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-6000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_9/pytorch_model_head.bin
Saving model

Configuration saved in ./training_output/checkpoint-7000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module weights save

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_10'.
Adding head 'fake_news_10' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5836
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7300


Step,Training Loss
500,0.6725
1000,0.6159
1500,0.5813
2000,0.5345
2500,0.5151
3000,0.4856
3500,0.4638
4000,0.4141
4500,0.4106
5000,0.3877


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-2000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_model_head.bin
Configurati

Configuration saved in ./training_output/checkpoint-3500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-4000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-5000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-5500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-7000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configurati

In [12]:
acc = np.array(acc)
f1 = np.array(f1)

print(
    'adapters',
    f'Accuracy {acc.mean():.3f}+-{acc.std():.3f}',
    f'F1 Score {f1.mean():.3f}+-{f1.std():.3f}',
    f' {acc.mean():.3f}+-{acc.std():.3f} | {f1.mean():.3f}+-{f1.std():.3f}'
)

adapters Accuracy 0.710+-0.014 F1 Score 0.690+-0.035  0.710+-0.014 | 0.690+-0.035


In [13]:
cv = cv_Kfold

In [14]:
acc = []
f1 = []

for train_cv, test_cv in cv:
    ds = DatasetDict()
    ds['train'] = Dataset.from_pandas(df[df.index.isin(train_cv)])
    ds['valid'] = Dataset.from_pandas(df[df.index.isin(test_cv)])
    
    
    ds = ds.map(encode_batch, batched=True, batch_size=len(ds['train']))
    ds.set_format(type="torch", columns=["input_ids", "attention_mask", "labels"])
    
    
    model = BertAdapterModel.from_pretrained('allegro/herbert-large-cased', config=config).to('cuda')

    adapter_name='fake_news_'+str(j)
    
    model.add_adapter(adapter_name,config=adapter_config)
    model.add_classification_head(
        adapter_name,
        id2label=id2label,
        num_labels=num_labels
      )

    model.train_adapter(adapter_name)
    
    
    trainer = AdapterTrainer(
        model=model,
        args=training_args,
        train_dataset=ds["train"],
        eval_dataset=ds["valid"],
        compute_metrics=compute_accuracy_f1score,
    )

    trainer.train()
    
    eval_out = trainer.evaluate()
    
    acc.append(eval_out['eval_accuracy'])
    f1.append(eval_out['eval_f1score'])
    
    j += 1

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_11'.
Adding head 'fake_news_11' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5886
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6826
1000,0.6219
1500,0.581
2000,0.5405
2500,0.5119
3000,0.5044
3500,0.4691
4000,0.4426
4500,0.4172
5000,0.3914


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-1500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_9/head_config.json
Module weights save

Configuration saved in ./training_output/checkpoint-2500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_5/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-3000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_model_head.bin
Configu

Configuration saved in ./training_output/checkpoint-3500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_11/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-4000
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output

Configuration saved in ./training_output/checkpoint-4500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_7/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-5000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuratio

Saving model checkpoint to ./training_output/checkpoint-6000
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_9/head_config.json
Module weights save

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_12'.
Adding head 'fake_news_12' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6733
1000,0.6077
1500,0.5703
2000,0.5338
2500,0.5187
3000,0.5048
3500,0.4556
4000,0.4334
4500,0.4178
5000,0.383


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-1500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_1/head_config.json
Module we

Module weights saved in ./training_output/checkpoint-2000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_10/pytorch_model_head.bin
Configurat

Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-3500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_9/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-4000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_12/head_config.json
Module weights

Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_9/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-6500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights 

Module weights saved in ./training_output/checkpoint-7000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_12/pytorch_model_head.bin


Training completed. Do not forget to share your model on huggingface.co/models =)


***** Running Evaluation *****
  Num examples = 654
  Batch size = 32


  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_13'.
Adding head 'fake_news_13' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6711
1000,0.5969
1500,0.57
2000,0.5234
2500,0.5213
3000,0.4854
3500,0.4486
4000,0.4083
4500,0.3943
5000,0.3659


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-1500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_10/adapter_config.json
Module weights 

Module weights saved in ./training_output/checkpoint-2000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_adapter.bin
C

Configuration saved in ./training_output/checkpoint-2500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_6/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-3000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_model_head.bin
Config

Saving model checkpoint to ./training_output/checkpoint-4000
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Configuration saved in ./training_output/checkpoint-4500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_6/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-5500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_5/pytorch_model_head.bin
Configurati

Configuration saved in ./training_output/checkpoint-6500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_12/head_config.json
Module weights

Module weights saved in ./training_output/checkpoint-7000/fake_news_13/pytorch_model_head.bin


Training completed. Do not forget to share your model on huggingface.co/models =)


***** Running Evaluation *****
  Num examples = 654
  Batch size = 32


  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_14'.
Adding head 'fake_news_14' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6758
1000,0.6011
1500,0.5795
2000,0.5448
2500,0.515
3000,0.4916
3500,0.4546
4000,0.4389
4500,0.4201
5000,0.3789


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_5/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-1500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_7/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-2500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/head_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-3000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_adapter.bin
Co

Configuration saved in ./training_output/checkpoint-3500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-4000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_6/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-5500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/head_config.json
Module weigh

Module weights saved in ./training_output/checkpoint-6000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-6500
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_ou

Saving model checkpoint to ./training_output/checkpoint-7000
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_15'.
Adding head 'fake_news_15' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6774
1000,0.6035
1500,0.5721
2000,0.5352
2500,0.5251
3000,0.4886
3500,0.4577
4000,0.4305
4500,0.4168
5000,0.3765


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_3/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-1500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_4/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-2000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-2500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_4/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-3500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_5/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-4500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_5/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-6000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_model_head.bin
Configuration s

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_16'.
Adding head 'fake_news_16' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6777
1000,0.5919
1500,0.5758
2000,0.5339
2500,0.507
3000,0.5009
3500,0.4583
4000,0.4215
4500,0.4004
5000,0.3801


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_16/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-1000
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-1000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_16/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-1500
Configuration saved in ./training_output/checkpoint-1500/fake_news_1/adapter_config.json
Module weights saved in ./traini

Configuration saved in ./training_output/checkpoint-1500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_15/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_model_head.bin
Config

Configuration saved in ./training_output/checkpoint-2500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/head_config.json
Module weights sav

Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_7/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-3500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/head_config.json
Module weights sa

Module weights saved in ./training_output/checkpoint-4000/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_16/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_15/pytorch_adapter.bin
C

Configuration saved in ./training_output/checkpoint-5500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_14/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-6000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_12/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-6500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_11/head_config.json
Module weigh

Module weights saved in ./training_output/checkpoint-7000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_10/pytorch_adapter.bin
Configurat

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_17'.
Adding head 'fake_news_17' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6771
1000,0.6183
1500,0.573
2000,0.5425
2500,0.522
3000,0.4978
3500,0.4463
4000,0.4335
4500,0.4115
5000,0.3841


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_17/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-1000
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_12/pytorch_model_head.bin
Config

Configuration saved in ./training_output/checkpoint-1500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_7/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-2000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_1/pytorch_model_head.bin
Con

Configuration saved in ./training_output/checkpoint-2500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_15/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-3500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_10/adapter_config.json
Module weights 

Module weights saved in ./training_output/checkpoint-4000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_7/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-4500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_4/head_config.json
Module weights save

Configuration saved in ./training_output/checkpoint-4500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_17/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-5000
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_outp

Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_14/pytorch_model_head.bin
Co

Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_9/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-6000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_3/pytorch_model_head.bin
Configu

Configuration saved in ./training_output/checkpoint-6500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_16/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-7000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_13/pytorch_model_head.bin
Conf

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_18'.
Adding head 'fake_news_18' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6694
1000,0.6134
1500,0.5857
2000,0.5323
2500,0.5202
3000,0.4848
3500,0.4591
4000,0.4278
4500,0.4189
5000,0.3747


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_16/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_7/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-1500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_18/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-2500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-3000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_5/pytorch_adapter.bin
Configuratio

Module weights saved in ./training_output/checkpoint-3000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_18/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-3500
Configuration saved in ./training_output/checkpoint-3500/fake_news_1/adapter_config.json
Module weights saved in ./traini

Configuration saved in ./training_output/checkpoint-3500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_11/head_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-4000/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_15/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_11/pytorch_adapter.bin
Config

Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_7/adapter_config.json
Module weights s

Configuration saved in ./training_output/checkpoint-5500/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_18/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-6000
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/c

Module weights saved in ./training_output/checkpoint-6000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_model_head.bin
Co

Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/head_config.json
Module weights save

Module weights saved in ./training_output/checkpoint-7000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_16/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_16/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_17/pytorch_adapter.bin
C

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_19'.
Adding head 'fake_news_19' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6641
1000,0.6076
1500,0.5706
2000,0.5383
2500,0.4923
3000,0.4977
3500,0.4592
4000,0.42
4500,0.4043
5000,0.3729


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_14/head_config.json
Module weights saved 

Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-1500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_15/adapter_config.json
Modul

Module weights saved in ./training_output/checkpoint-2000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_9/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_9/pytorch_adapter.bin
Configuratio

Saving model checkpoint to ./training_output/checkpoint-2500
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/che

Module weights saved in ./training_output/checkpoint-2500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_13/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-3000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_2/head_config.json
Module weig

Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_14/pytorch_model_head.bin
Conf

Configuration saved in ./training_output/checkpoint-4000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_9/adapter_config.json
Module weights s

Module weights saved in ./training_output/checkpoint-4000/fake_news_19/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-4500
Configuration saved in ./training_output/checkpoint-4500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_3/adapter_config.json
Module weights saved in ./training_outpu

Configuration saved in ./training_output/checkpoint-4500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/head_config.json
Module weigh

Module weights saved in ./training_output/checkpoint-5000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_1/pytorch_model_head.bin
Con

Configuration saved in ./training_output/checkpoint-5500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_14/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_8/pytorch_model_head.bin
Configuration s

Configuration saved in ./training_output/checkpoint-6000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_19/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-6500
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/c

Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_12/pytorch_model_head.bin
Config

Configuration saved in ./training_output/checkpoint-7000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_1/head_config.json
Module we

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

loading weights file https://huggingface.co/allegro/herbert-large-cased/resolve/main/pytorch_model.bin from cache at /home/marek/.cache/huggingface/transformers/ca58839b8e4b1222703e13158ffeb3a5a7330260cbc39513f74710674d70268b.ad71128a5739887a02bfa6de2fa8768f86e02cd13d0c308873f4cdba254e4c7c
Adding head 'fake_news_1' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_2' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_3' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Adding head 'fake_news_4' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh',

Adding adapter 'fake_news_20'.
Adding head 'fake_news_20' with config {'head_type': 'classification', 'num_labels': 2, 'layers': 2, 'activation_function': 'tanh', 'label2id': {0: 0, 1: 1}, 'use_pooler': False, 'bias': True}.
Using cuda_amp half precision backend
***** Running training *****
  Num examples = 5887
  Num Epochs = 10
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 7360


Step,Training Loss
500,0.6679
1000,0.6017
1500,0.5761
2000,0.5336
2500,0.51
3000,0.4916
3500,0.4637
4000,0.4294
4500,0.4174
5000,0.3959


Saving model checkpoint to ./training_output/checkpoint-500
Configuration saved in ./training_output/checkpoint-500/fake_news_1/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-500

Configuration saved in ./training_output/checkpoint-500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_8/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_8/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-500/fake_news_12/head_config.json
Module weights saved in .

Module weights saved in ./training_output/checkpoint-1000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_17/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_17/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1000/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-1000/fake_news_19/pytorch_adapter.bin
C

Configuration saved in ./training_output/checkpoint-1500/fake_news_9/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_10/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_10/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-1500/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-1500/fake_news_12/adapter_config.json
Module 

Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_4/pytorch_model_head.bin
Configuration s

Module weights saved in ./training_output/checkpoint-2000/fake_news_9/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_10/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-2000/fake_news_14/pytorch_model_head.bin
Co

Configuration saved in ./training_output/checkpoint-2500/fake_news_18/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_18/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_19/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_20/adapter_config.json
Module weights saved in ./training_output/checkpoint-2500/fake_news_20/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-2500/fake_news_20/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-3000/fake_news_10/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_11/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_11/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-3000/fake_news_13/pytorch_adapter.bin
C

Configuration saved in ./training_output/checkpoint-3500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_6/adapter_config.json
Module weights s

Configuration saved in ./training_output/checkpoint-3500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-3500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-3500/fake_news_17/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-4000/fake_news_19/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_20/adapter_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_20/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_20/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_20/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-4000/fake_news_2/pytorch_model_head.bin
Configur

Configuration saved in ./training_output/checkpoint-4500/fake_news_12/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_12/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_12/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_12/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-4500/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-4500/fake_news_14/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_7/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-5000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_15/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_15/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-5000/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5000/fake_news_19/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-5500/fake_news_20/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_20/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_20/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_1/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-5500/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-5500/fake_news_4/pytorch_model_head.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6000/fake_news_13/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_13/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_13/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_14/head_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_14/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_15/adapter_config.json
Module weights saved in ./training_output/checkpoint-6000/fake_news_15/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6000/fake_news_15/head_config.json
Module w

Module weights saved in ./training_output/checkpoint-6500/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_6/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_7/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_adapter.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_7/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_7/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_8/adapter_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_8/pytorch_adapter.bin
Configuratio

Configuration saved in ./training_output/checkpoint-6500/fake_news_16/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_16/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_17/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_17/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_18/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_18/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_19/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_19/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-6500/fake_news_20/head_config.json
Module weights saved in ./training_output/checkpoint-6500/fake_news_20/pytorch_model_head.bin
Saving model checkpoint to ./training_output/checkpoint-7000
Configuration saved in ./training_

Module weights saved in ./training_output/checkpoint-7000/fake_news_1/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_2/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_2/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_3/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_3/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_4/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_4/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_5/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_5/pytorch_model_head.bin
Configuration saved in ./training_output/checkpoint-7000/fake_news_6/head_config.json
Module weights saved in ./training_output/checkpoint-7000/fake_news_6/pytorch_model_head.bin
Configuratio

In [15]:
acc = np.array(acc)
f1 = np.array(f1)

print(
    'adapters',
    f'Accuracy {acc.mean():.3f}+-{acc.std():.3f}',
    f'F1 Score {f1.mean():.3f}+-{f1.std():.3f}',
    f' {acc.mean():.3f}+-{acc.std():.3f} | {f1.mean():.3f}+-{f1.std():.3f}'
)

adapters Accuracy 0.719+-0.016 F1 Score 0.707+-0.016  0.719+-0.016 | 0.707+-0.016
