In [None]:
!pip install transformers
!pip install datasets
!pip install --upgrade --no-cache-dir gdown==4.5.4

!gdown 18oZZ4jqRK-uF-Nz6ftRdgNjKix88hrnO
!unzip data_and_models.zip && rm data_and_models.zip

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting transformers
  Downloading transformers-4.23.1-py3-none-any.whl (5.3 MB)
[K     |████████████████████████████████| 5.3 MB 4.7 MB/s 
Collecting tokenizers!=0.11.3,<0.14,>=0.11.1
  Downloading tokenizers-0.13.1-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.6 MB)
[K     |████████████████████████████████| 7.6 MB 70.2 MB/s 
Collecting huggingface-hub<1.0,>=0.10.0
  Downloading huggingface_hub-0.10.1-py3-none-any.whl (163 kB)
[K     |████████████████████████████████| 163 kB 86.9 MB/s 
Installing collected packages: tokenizers, huggingface-hub, transformers
Successfully installed huggingface-hub-0.10.1 tokenizers-0.13.1 transformers-4.23.1
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting datasets
  Downloading datasets-2.6.1-py3-none-any.whl (441 kB)
[K     |████████████████████████████████| 441 kB 4.7 MB/

In [None]:
import csv
import pickle
import random
import time

from datasets import load_metric
import numpy as np
import pandas as pd
import torch
from transformers import RobertaForSequenceClassification, RobertaTokenizerFast, Trainer, TrainingArguments

def compute_metrics(eval_preds):
    """Compute classification accuracy for a Trainer evaluation pass.

    Args:
        eval_preds: pair ``(logits, labels)``; ``logits`` holds one score per
            class along the last axis and ``labels`` the reference class ids.

    Returns:
        dict with a single key ``"accuracy"`` mapping to the fraction of
        examples whose highest-scoring class equals the reference label.
    """
    logits, labels = eval_preds
    predictions = np.argmax(logits, axis=-1)
    # Accuracy is computed directly with NumPy: this avoids re-loading the
    # metric script on every evaluation and does not depend on the deprecated
    # `datasets.load_metric` helper. The returned dict has the same shape.
    return {"accuracy": float(np.mean(predictions == np.asarray(labels)))}

class PSCDataset(torch.utils.data.Dataset):
    """Dataset that pairs tokenizer encodings with per-example labels.

    ``encodings`` must expose ``.items()`` yielding ``(name, column)`` pairs
    where ``column[idx]`` is the value for example ``idx``; ``labels`` is an
    indexable, sized collection with one entry per example.
    """

    def __init__(self, encodings, labels):
        self.labels = labels
        self.encodings = encodings

    def __len__(self):
        # The dataset size is defined by the number of labels.
        return len(self.labels)

    def __getitem__(self, idx):
        """Return a dict of tensors for example ``idx``, including ``'labels'``."""
        sample = {}
        for name, column in self.encodings.items():
            sample[name] = torch.tensor(column[idx])
        # Added last, so it overrides any encoding column that is also named 'labels'.
        sample['labels'] = torch.tensor(self.labels[idx])
        return sample

def top_k_accuracy(top_k, predictions, labels):
  """Fraction of examples whose label is among the ``top_k`` highest scores.

  ``predictions[i]`` is the sequence of per-class scores for example ``i`` and
  ``labels[i]`` its reference class index. Classes with equal scores keep
  their index order (lower index ranks first). Both inputs must have the same
  length; an empty input raises ``ZeroDivisionError``.
  """
  assert len(predictions) == len(labels)
  hits = 0
  for row in range(len(predictions)):
    scores = list(predictions[row])
    # Stable sort on the negated score: descending by score, ties by class index.
    ranked = sorted(range(len(scores)), key=lambda cls: -scores[cls])
    if any(cls == labels[row] for cls in ranked[:top_k]):
      hits += 1
  return hits / len(predictions)

# ---- Experiment configuration (module-level state read by compute()) ----
# Folder holding target_corpus.csv; the results file is also written here.
directory = "./data_and_models/"
# NOTE(review): all_df is not referenced anywhere else in this cell — compute()
# re-reads the CSV with the csv module instead.
all_df = pd.read_csv(directory+"target_corpus.csv")
epochs = 20  # passed to TrainingArguments as num_train_epochs
seeds = [11, 12, 13, 14, 15]  # one full train/evaluate run per seed
# NOTE(review): start is recorded but never read in this cell.
start = time.time()
tokenizer = RobertaTokenizerFast.from_pretrained('roberta-base')

# Per-task settings, keyed by task name:
#   number_of_labels - size of the classification head (num_labels)
#   label_column     - index of the CSV column holding that task's label
#                      (column 0 is used as the text)
# NOTE(review): the first task is keyed "44" but configured with 42 labels —
# confirm which is intended; the key is also used in the saved results keys.
tasks = {
    "44": {
        "number_of_labels": 42,
         "label_column": 1,
    },
    "8": {
        "number_of_labels": 8,
        "label_column": 2,
    }
}

def _load_corpus(task):
  """Read target_corpus.csv and encode the task's label column as integer ids.

  Returns ``(texts, labels, classes)``: ``texts`` is column 0 of every data
  row, ``labels`` the matching integer class ids, and ``classes`` the mapping
  from raw label string to id (ids are assigned in order of first appearance).
  """
  label_column = tasks[task]["label_column"]
  classes = {}
  texts = []
  labels = []
  # newline="" is what the csv module expects, so that line breaks inside
  # quoted fields are handled by the reader itself.
  with open(directory + "target_corpus.csv", newline="") as doc:
    reader = csv.reader(doc)
    next(reader)  # skip the header row
    for row in reader:
      topic = row[label_column]
      # setdefault hands out the next free id the first time a label is seen.
      labels.append(classes.setdefault(topic, len(classes)))
      texts.append(row[0])
  return texts, labels, classes


def compute(task, mlength):
  """Fine-tune roberta-base on one task once per seed and collect test accuracy.

  Args:
    task: key into the module-level ``tasks`` dict (selects the label column
      and the number of output labels).
    mlength: ``max_length`` passed to the tokenizer (inputs are truncated).

  Returns:
    List with one top-1 test accuracy per entry of the module-level ``seeds``.

  Raises:
    ValueError: if the corpus contains more distinct labels than the task's
      configured ``number_of_labels``.

  For every seed the corpus is split into train/dev/test with 625 examples
  each in dev and test, a fresh model is trained with the Trainer, and the
  checkpoint selected by ``load_best_model_at_end`` is scored on the test split.
  """
  from sklearn.model_selection import train_test_split

  num_labels = tasks[task]["number_of_labels"]

  # The corpus does not depend on the seed, so it is parsed once per call.
  texts, labels, classes = _load_corpus(task)
  if len(classes) > num_labels:
    # Fail before any training starts: label ids would not fit the classifier head.
    raise ValueError(
        "task %r has %d distinct labels but number_of_labels is %d"
        % (task, len(classes), num_labels))

  def model_init():
    return RobertaForSequenceClassification.from_pretrained("roberta-base", num_labels=num_labels)

  t1 = []  # t1: top 1 accuracy, one entry per seed

  for seed in seeds:
    np.random.seed(seed)
    torch.manual_seed(seed)
    random.seed(seed)

    print("# classes", len(classes))
    # test_size is an absolute count: 625 test rows, then 625 dev rows.
    X_train, X_test, y_train, y_test = train_test_split(texts, labels, test_size=625, random_state=seed)
    X_train, X_dev, y_train, y_dev = train_test_split(X_train, y_train, test_size=625, random_state=seed)
    print(len(X_train), len(X_dev), len(X_test))
    print("# classes in train", len(set(y_train)))
    print("# classes in dev", len(set(y_dev)))
    print("# classes in test", len(set(y_test)))

    train_encodings = tokenizer(X_train, truncation=True, padding=True, max_length=mlength)
    dev_encodings = tokenizer(X_dev, truncation=True, padding=True, max_length=mlength)
    test_encodings = tokenizer(X_test, truncation=True, padding=True, max_length=mlength)

    train_dataset = PSCDataset(train_encodings, y_train)
    dev_dataset = PSCDataset(dev_encodings, y_dev)
    test_dataset = PSCDataset(test_encodings, y_test)

    # NOTE(review): a checkpoint is written every epoch into the same
    # ./results directory for every seed/task/length combination.
    training_args = TrainingArguments(
        output_dir="./results",          # output directory
        num_train_epochs=epochs,         # total number of training epochs
        per_device_train_batch_size=16,  # batch size per device during training
        per_device_eval_batch_size=64,   # batch size for evaluation
        warmup_steps=0,                  # number of warmup steps for learning rate scheduler
        weight_decay=0.01,               # strength of weight decay
        logging_dir='./logs',            # directory for storing logs
        logging_steps=10,
        learning_rate=2e-5,
        save_strategy="epoch",
        evaluation_strategy="epoch",
        load_best_model_at_end=True,
        seed=seed,
    )

    trainer = Trainer(
        model_init=model_init,               # factory returning a fresh model for this run
        args=training_args,                  # training arguments, defined above
        train_dataset=train_dataset,         # training dataset
        eval_dataset=dev_dataset,            # evaluation dataset
        compute_metrics=compute_metrics,     # compute_metrics
        )

    trainer.train()
    predictions = trainer.predict(test_dataset)

    t1.append(top_k_accuracy(1, predictions.predictions, test_dataset.labels))
  return t1

# Run every task at every maximum sequence length. results maps
# "<task>/<max_length>" to the list of per-seed accuracies returned by compute().
results = {}
for task in tasks:
  for mlength in [64, 256, 512]:
    result = compute(task, mlength)
    key = task + "/" + str(mlength)
    results[key] = result

# results is a plain dict, so np.save stores it as a pickled object array;
# reading it back should need np.load(path, allow_pickle=True).item() — TODO confirm.
np.save( directory + "figure_1_appendix_results.npy", results)


Downloading:   0%|          | 0.00/899k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/456k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/1.36M [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/481 [00:00<?, ?B/s]

# classes 42
2915 625 625
# classes in train 42
# classes in dev 36
# classes in test 35


loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12",
    "13": "LABEL_13",
    "14": "LABEL_14",
    "15": "LABEL_15",
    "16": "LABEL_16",
    "17": "LABEL_17",
    "18": "LABEL_18",
    "19": "LABEL_19",
    "20": "LABEL_20",
    "21": "LABEL_21",
    "22": "LABEL_22",
    "23": "LABEL_23",
    "24": "LABEL_24",
    "25": "LABEL_25",

Downloading:   0%|          | 0.00/501M [00:00<?, ?B/s]

loading weights file pytorch_model.bin from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/pytorch_model.bin
Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'roberta.pooler.dense.weight', 'lm_head.layer_norm.bias', 'roberta.pooler.dense.bias', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.bias', 'lm_head.layer_norm.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some 

Epoch,Training Loss,Validation Loss,Accuracy
1,2.6217,2.499005,0.3856
2,2.2118,2.175195,0.472
3,1.8312,2.090887,0.4752
4,1.7699,2.043772,0.4976
5,1.3144,2.143308,0.4752
6,1.1916,2.247154,0.4704
7,0.9222,2.221262,0.48
8,0.4785,2.344559,0.4608
9,0.5444,2.501603,0.4592
10,0.4185,2.493924,0.4656


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
  del sys.path[0]


Downloading builder script:   0%|          | 0.00/1.65k [00:00<?, ?B/s]

Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving m

# classes 42
2915 625 625
# classes in train 42
# classes in dev 38
# classes in test 36


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.5784,2.494752,0.3888
2,2.3009,2.285124,0.4192
3,1.7127,2.13738,0.4608
4,1.5222,2.169816,0.4736
5,1.2275,2.191029,0.4576
6,0.9274,2.270136,0.4624
7,0.8883,2.319786,0.4576
8,0.4958,2.372674,0.4608
9,0.4589,2.494482,0.4608
10,0.3822,2.557843,0.4672


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 41
# classes in dev 38
# classes in test 37


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.5776,2.530531,0.3792
2,2.1763,2.382901,0.4336
3,1.9079,2.250292,0.456
4,1.5843,2.276685,0.44
5,1.2387,2.39972,0.4448
6,0.9562,2.480031,0.4192
7,0.7625,2.538512,0.4256
8,0.6277,2.471473,0.464
9,0.6259,2.677087,0.4512
10,0.4263,2.737224,0.4512


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 35
# classes in test 37


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.6654,2.6206,0.3456
2,2.3401,2.360425,0.408
3,1.832,2.271099,0.4112
4,1.4061,2.325723,0.4352
5,1.2391,2.369185,0.4176
6,1.1022,2.463613,0.4096
7,0.9134,2.611687,0.3968
8,0.4532,2.594323,0.408
9,0.4833,2.64066,0.4064
10,0.3938,2.798657,0.3984


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 38
# classes in test 35


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.7695,2.648046,0.3616
2,2.1731,2.356622,0.424
3,1.9705,2.283024,0.4304
4,1.5994,2.235606,0.4384
5,1.4288,2.39247,0.4256
6,0.9909,2.399296,0.4304
7,0.86,2.498942,0.4416
8,0.5664,2.595352,0.4288
9,0.4349,2.710012,0.4432
10,0.4795,2.841173,0.4192


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 36
# classes in test 35


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.4907,2.291392,0.4432
2,2.0032,1.939445,0.5216
3,1.6227,1.81022,0.5424
4,1.358,1.819359,0.52
5,1.0282,1.844699,0.5248
6,0.8642,1.910618,0.5264
7,0.6003,1.951114,0.5376
8,0.3956,2.024622,0.5248
9,0.3791,2.067181,0.5296
10,0.2518,2.118134,0.5168


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 38
# classes in test 36


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.5136,2.331985,0.4256
2,2.1762,2.072746,0.4688
3,1.5499,1.929446,0.5024
4,1.3799,1.832429,0.5184
5,0.9662,1.879472,0.5216
6,0.7541,1.921443,0.5344
7,0.7293,1.994064,0.5296
8,0.2951,2.085191,0.5264
9,0.4006,2.184536,0.5424
10,0.2526,2.320652,0.528


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 41
# classes in dev 38
# classes in test 37


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.5391,2.44289,0.4144
2,1.991,2.177721,0.472
3,1.6936,2.007495,0.4944
4,1.3995,2.003397,0.5024
5,1.0748,2.062061,0.4912
6,0.8272,2.090632,0.5152
7,0.6527,2.137616,0.4912
8,0.4672,2.197981,0.5056
9,0.5459,2.278202,0.5008
10,0.3083,2.385895,0.5024


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 35
# classes in test 37


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.4769,2.479219,0.3808
2,2.0454,2.143213,0.456
3,1.5361,2.043451,0.48
4,1.362,1.986266,0.4688
5,0.9518,1.98832,0.4944
6,0.808,2.087839,0.4864
7,0.6759,2.20315,0.472
8,0.3153,2.291127,0.4592
9,0.3796,2.288975,0.4816
10,0.2594,2.43152,0.4752


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 38
# classes in test 35


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.6052,2.428265,0.4224
2,1.9466,2.156282,0.4608
3,1.7712,2.005743,0.48
4,1.1742,2.01611,0.4608
5,1.0592,2.153371,0.4592
6,0.6974,2.158676,0.4816
7,0.5897,2.246525,0.4816
8,0.376,2.383993,0.4656
9,0.2744,2.449046,0.4672
10,0.2424,2.48571,0.4768


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 36
# classes in test 35


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.4303,2.288778,0.4176
2,1.9171,1.934722,0.5168
3,1.5825,1.823273,0.5424
4,1.3624,1.823743,0.5488
5,0.9723,1.889241,0.5232
6,0.848,1.888951,0.5344
7,0.5739,2.010903,0.5328
8,0.4092,1.98929,0.5536
9,0.3174,2.029555,0.5632
10,0.2309,2.128701,0.5328


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 38
# classes in test 36


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.4401,2.280676,0.4352
2,2.1084,2.000825,0.4736
3,1.4616,1.840411,0.512
4,1.2014,1.78463,0.528
5,0.9437,1.797061,0.5472
6,0.6154,1.897894,0.5328
7,0.6419,1.956028,0.5392
8,0.2293,2.03653,0.544
9,0.3249,2.070697,0.5376
10,0.1992,2.198223,0.5312


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 41
# classes in dev 38
# classes in test 37


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.5073,2.389546,0.4032
2,1.9702,2.135563,0.472
3,1.7043,1.997115,0.496
4,1.453,2.0351,0.48
5,0.9569,2.062247,0.4864
6,0.6945,2.15573,0.4864
7,0.5929,2.221344,0.5088
8,0.4993,2.261892,0.4944
9,0.4328,2.324211,0.5056
10,0.2564,2.473519,0.4928


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 35
# classes in test 37


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.5149,2.50049,0.3648
2,2.0622,2.101844,0.464
3,1.5385,1.987228,0.472
4,1.2171,1.94286,0.5024
5,0.8703,1.969932,0.4896
6,0.7309,2.034905,0.4896
7,0.6832,2.094531,0.4992
8,0.3393,2.186576,0.488
9,0.2957,2.145506,0.5184
10,0.2354,2.275206,0.4928


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 42
2915 625 625
# classes in train 42
# classes in dev 38
# classes in test 35


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,2.592,2.406589,0.424
2,1.8191,2.11586,0.4624
3,1.7895,1.973715,0.4896
4,1.187,1.987817,0.4832
5,1.018,2.02603,0.4832
6,0.6837,2.087702,0.4896
7,0.5114,2.160427,0.4848
8,0.4005,2.265558,0.4912
9,0.2759,2.363732,0.4912
10,0.1687,2.525493,0.48


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3789,1.337807,0.5344
2,1.0988,1.34299,0.5456
3,0.9794,1.298765,0.584
4,0.9686,1.39653,0.56
5,0.6311,1.525748,0.5568
6,0.2218,1.831988,0.5552
7,0.2571,1.997571,0.5392
8,0.0846,2.182239,0.5712
9,0.086,2.467403,0.5552
10,0.0763,2.59986,0.5616


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3164,1.388045,0.5296
2,1.1313,1.28397,0.5536
3,0.8759,1.368154,0.584
4,0.6556,1.457107,0.5664
5,0.4724,1.533135,0.5712
6,0.301,1.711547,0.5472
7,0.2123,1.930853,0.5552
8,0.1635,2.252084,0.5472
9,0.0336,2.40866,0.5584
10,0.0533,2.63143,0.552


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3762,1.393996,0.5232
2,1.1138,1.325008,0.5552
3,0.8447,1.406461,0.552
4,0.714,1.473362,0.576
5,0.4667,1.633926,0.5568
6,0.4165,1.770823,0.5504
7,0.1933,1.948338,0.5504
8,0.1975,2.053538,0.5392
9,0.162,2.501997,0.5456
10,0.0823,2.675789,0.552


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.4824,1.424911,0.4944
2,1.3111,1.317304,0.528
3,0.921,1.312024,0.5616
4,0.6433,1.475935,0.5424
5,0.6702,1.528984,0.5536
6,0.3964,1.603358,0.568
7,0.2933,1.971731,0.5344
8,0.1466,2.129893,0.5392
9,0.1037,2.377722,0.544
10,0.1367,2.629594,0.5328


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3772,1.363505,0.5488
2,1.1596,1.278537,0.5696
3,0.9054,1.246145,0.6
4,0.6656,1.369946,0.5968
5,0.4159,1.643938,0.56
6,0.3657,1.830832,0.544
7,0.351,2.120942,0.5472
8,0.1007,2.280218,0.5824
9,0.1193,2.666468,0.5344
10,0.107,2.763258,0.5584


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.2764,1.212613,0.5808
2,0.9798,1.117378,0.6336
3,0.8446,1.141515,0.6352
4,0.9145,1.255076,0.6304
5,0.5252,1.370795,0.6368
6,0.2031,1.474914,0.6336
7,0.1347,1.787149,0.64
8,0.1474,1.900893,0.6384
9,0.0161,2.206744,0.632
10,0.1032,2.280209,0.6432


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.1352,1.183312,0.576
2,0.8975,1.110124,0.6096
3,0.6851,1.113878,0.6384
4,0.6206,1.23994,0.6176
5,0.3613,1.375911,0.6224
6,0.1618,1.470408,0.6432
7,0.2102,1.676568,0.6464
8,0.1554,1.977858,0.6192
9,0.041,2.146773,0.6336
10,0.0344,2.35854,0.632


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.2362,1.338504,0.544
2,0.9726,1.212167,0.5824
3,0.7461,1.247118,0.5936
4,0.6456,1.407349,0.6016
5,0.2686,1.62115,0.5776
6,0.2984,1.663277,0.5952
7,0.1504,2.026405,0.5872
8,0.0395,2.343272,0.5968
9,0.1365,2.670512,0.5616
10,0.0077,2.74867,0.5664


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3516,1.308036,0.5536
2,1.0602,1.206354,0.592
3,0.6978,1.26686,0.576
4,0.5227,1.303626,0.6112
5,0.4642,1.486468,0.5856
6,0.208,1.64675,0.5936
7,0.1909,1.791024,0.576
8,0.2035,2.062284,0.5664
9,0.058,2.314323,0.584
10,0.167,2.583298,0.5872


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.2723,1.212246,0.584
2,1.0339,1.12845,0.6128
3,0.8078,1.156912,0.6048
4,0.7245,1.307925,0.6256
5,0.3936,1.393747,0.6096
6,0.1788,1.664022,0.6
7,0.2554,1.889004,0.6032
8,0.1367,2.065753,0.608
9,0.1179,2.459048,0.5984
10,0.0859,2.544351,0.592


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3199,1.205588,0.5776
2,0.9789,1.116255,0.6192
3,0.8163,1.130859,0.6336
4,0.8216,1.280719,0.632
5,0.4968,1.309494,0.6288
6,0.1466,1.554289,0.6096
7,0.1655,1.672504,0.6256
8,0.1786,1.918652,0.6288
9,0.0383,2.086765,0.6384
10,0.116,2.2943,0.6256


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.1399,1.186527,0.608
2,0.9094,1.059664,0.616
3,0.6856,1.133391,0.6304
4,0.6073,1.20822,0.6352
5,0.3167,1.424255,0.6192
6,0.1826,1.555377,0.632
7,0.1907,1.705964,0.624
8,0.098,1.995148,0.6336
9,0.0072,2.262979,0.6176
10,0.0135,2.442546,0.608


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.2681,1.286879,0.5488
2,0.961,1.170761,0.5904
3,0.6919,1.191083,0.6256
4,0.6424,1.341316,0.6224
5,0.3129,1.541527,0.624
6,0.2846,1.650567,0.5984
7,0.2486,1.889238,0.6064
8,0.1233,2.147868,0.6
9,0.1619,2.279927,0.6128
10,0.0433,2.516886,0.6144


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.3711,1.301919,0.5328
2,1.0813,1.196107,0.5968
3,0.6924,1.225822,0.6144
4,0.5353,1.311677,0.5984
5,0.348,1.458576,0.5984
6,0.1663,1.601807,0.6144
7,0.1594,1.825113,0.5968
8,0.1392,2.099366,0.608
9,0.0974,2.326327,0.5824
10,0.0113,2.486365,0.5904


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

# classes 8
2915 625 625
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.2929,1.18713,0.6032
2,1.0512,1.085045,0.6336
3,0.7895,1.104119,0.632
4,0.6917,1.240097,0.6064
5,0.3469,1.456409,0.6144
6,0.2584,1.631499,0.6352
7,0.2917,1.943097,0.6144
8,0.0631,2.06987,0.6304
9,0.1509,2.32331,0.6096
10,0.007,2.446229,0.6128


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-183
Configuration saved in ./results/checkpoint-183/config.json
Model weights saved in ./results/checkpoint-183/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-366
Configuration saved in ./results/checkpoint-366/config.json
Model weights saved in ./results/checkpoint-366/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-549
Configuration saved in ./results/checkpoint-549/config.json
Model weights saved in ./results/checkpoint-549/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-732
Configuration saved in ./results/checkpoint-732/config.json
Model weights saved in ./results/checkpoint-732/pytorch_model.bin
***** Ru

Epoch,Training Loss,Validation Loss,Accuracy
1,1.2929,1.18713,0.6032
2,1.0512,1.085045,0.6336
3,0.7895,1.104119,0.632
4,0.6917,1.240097,0.6064
5,0.3469,1.456409,0.6144
6,0.2584,1.631499,0.6352
7,0.2917,1.943097,0.6144
8,0.0631,2.06987,0.6304
9,0.1509,2.32331,0.6096
10,0.007,2.446229,0.6128


***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-3294
Configuration saved in ./results/checkpoint-3294/config.json
Model weights saved in ./results/checkpoint-3294/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-3477
Configuration saved in ./results/checkpoint-3477/config.json
Model weights saved in ./results/checkpoint-3477/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 625
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-3660
Configuration saved in ./results/checkpoint-3660/config.json
Model weights saved in ./results/checkpoint-3660/pytorch_model.bin


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from ./results/checkpoint-366 (score: 1.085044503211975).
***** Running Prediction *****
  Num examples = 625
  Batch size = 64


In [None]:
def process_result(result):
  """Summarise a collection of scores as a ``(mean, std)`` pair.

  Args:
    result: Sequence (or array-like) of numeric scores accepted by
      ``np.mean`` / ``np.std``.

  Returns:
    A 2-tuple ``(mean, std)``, each value rounded to three decimal places.
    The standard deviation uses ``np.std`` with its default arguments.
  """
  # Apply each statistic in turn (mean first, then std) and round to 3 places.
  return tuple(round(statistic(result), 3) for statistic in (np.mean, np.std))

# Print one tab-separated line per entry of `results`: the entry's key followed
# by the (mean, std) summary of its collected scores.
for key in results:
  result = results[key]
  print(key, "\t", process_result(result))

44/64 	 (0.472, 0.014)
44/256 	 (0.511, 0.015)
44/512 	 (0.527, 0.013)
8/64 	 (0.581, 0.014)
8/256 	 (0.625, 0.007)
8/512 	 (0.631, 0.015)


In [None]:
# Take the finishing wall-clock timestamp and report the elapsed time in whole
# minutes. `start` is not defined in this cell -- presumably it was captured with
# time.time() by an earlier cell; verify before running this cell in isolation.
end = time.time()
# Floor-dividing the float difference by 60 yields a float (e.g. 472.0), which is
# why the printed value carries a trailing ".0".
print(f"The program took {(end - start) // 60} minutes in total.")

The program took 472.0 minutes in total.


In [None]:
# Final cell: calls `runtime.unassign()` from the Colab-only `google.colab`
# package. NOTE(review): this presumably disconnects and releases the Colab VM
# once the long run has finished, so it only works inside Google Colab and any
# un-saved in-memory state would be lost -- confirm before reusing elsewhere.
from google.colab import runtime
runtime.unassign()