In [None]:
!pip install transformers
!pip install datasets
!pip install --upgrade --no-cache-dir gdown==4.5.4

!gdown 18oZZ4jqRK-uF-Nz6ftRdgNjKix88hrnO
!unzip data_and_models.zip && rm data_and_models.zip

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting transformers
  Downloading transformers-4.23.1-py3-none-any.whl (5.3 MB)
[K     |████████████████████████████████| 5.3 MB 4.9 MB/s 
Collecting tokenizers!=0.11.3,<0.14,>=0.11.1
  Downloading tokenizers-0.13.1-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.6 MB)
[K     |████████████████████████████████| 7.6 MB 70.1 MB/s 
Collecting huggingface-hub<1.0,>=0.10.0
  Downloading huggingface_hub-0.10.1-py3-none-any.whl (163 kB)
[K     |████████████████████████████████| 163 kB 83.9 MB/s 
Installing collected packages: tokenizers, huggingface-hub, transformers
Successfully installed huggingface-hub-0.10.1 tokenizers-0.13.1 transformers-4.23.1
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting datasets
  Downloading datasets-2.6.1-py3-none-any.whl (441 kB)
[K     |████████████████████████████████| 441 kB 4.7 MB/

In [None]:
from collections import defaultdict
import csv
import random
import time

from datasets import load_metric
import numpy as np
from sklearn.model_selection import train_test_split
import torch
from transformers import RobertaTokenizerFast


def compute_metrics(eval_preds):
    """Compute classification accuracy for the Trainer's evaluation loop.

    Args:
        eval_preds: a pair ``(logits, labels)``; ``logits`` holds one score per
            class along the last axis, ``labels`` holds the reference class ids.

    Returns:
        ``{"accuracy": float}`` -- the fraction of rows whose arg-max class
        equals the label (``0.0`` when there are no rows).

    Raises:
        ValueError: if the predicted classes and the labels differ in shape.
    """
    logits, labels = eval_preds
    predictions = np.argmax(logits, axis=-1)
    labels = np.asarray(labels)
    if predictions.shape != labels.shape:
        # Refuse to broadcast silently: a mismatch means the inputs are wrong.
        raise ValueError(
            "predictions and labels differ in shape: "
            f"{predictions.shape} vs {labels.shape}"
        )
    if labels.size == 0:
        return {"accuracy": 0.0}
    # Computed directly with NumPy instead of calling load_metric("accuracy")
    # on every evaluation pass: no metric script is fetched or re-instantiated
    # during training, and the returned key/value shape stays the same.
    return {"accuracy": float(np.mean(predictions == labels))}

  
# Folder that holds the corpus CSV read by compute_task and that receives the
# saved results file (presumably created by unpacking data_and_models.zip).
directory = "./data_and_models/"
# Passed as max_length to the tokenizer when encoding the train/dev/test texts.
mlength = 512
# Timestamp taken when the cell starts; it is not read again in the visible code.
start = time.time()
# Tokenizer shared by every run; loaded once from the 'roberta-base' checkpoint.
tokenizer = RobertaTokenizerFast.from_pretrained('roberta-base')

class PSCDataset(torch.utils.data.Dataset):
    """Map-style dataset pairing tokenizer encodings with integer labels.

    ``encodings`` is a mapping from field name to a per-example sequence and
    ``labels`` is a sequence with one entry per example.
    """

    def __init__(self, encodings, labels):
        self.encodings = encodings
        self.labels = labels

    def __len__(self):
        # The number of examples is defined by the label sequence.
        return len(self.labels)

    def __getitem__(self, idx):
        """Return example ``idx`` as a dict of tensors, with the label under 'labels'."""
        sample = {}
        for field, values in self.encodings.items():
            sample[field] = torch.tensor(values[idx])
        sample['labels'] = torch.tensor(self.labels[idx])
        return sample

def top_k_accuracy(top_k, predictions, labels):
    """Fraction of examples whose label is among the ``top_k`` highest scores.

    Args:
        top_k: number of highest-scoring classes to accept per example.
        predictions: sequence of per-example score sequences, indexed by class id.
        labels: sequence of reference class ids, aligned with ``predictions``.

    Returns:
        ``correct / total`` as a float, or ``0.0`` when there are no examples
        (previously this case raised ``ZeroDivisionError``).

    Raises:
        AssertionError: if ``predictions`` and ``labels`` differ in length.
    """
    assert len(predictions) == len(labels)
    total = len(predictions)
    if total == 0:
        return 0.0

    correct = 0
    for row, label in zip(predictions, labels):
        scores = list(row)
        # Class ids ordered by descending score. The sort is stable, so classes
        # with equal scores keep ascending-id order, as in the original ranking.
        ranked = sorted(range(len(scores)), key=lambda class_id: -scores[class_id])
        if any(class_id == label for class_id in ranked[:top_k]):
            correct += 1
    return correct / total

# Per-task settings, keyed by task name:
#   number_of_labels -- passed as num_labels when the classifier is created
#   label_column     -- index of the CSV column read as the class label
# NOTE(review): the first key is "44" while number_of_labels is 42 (the logged
# run also reports 42 classes for it) -- confirm the key is only a task name.
tasks = {
    "44": dict(number_of_labels=42, label_column=1),
    "8": dict(number_of_labels=8, label_column=2),
}

def _load_corpus(path, label_column):
    """Read the corpus CSV and return ``(texts, labels, n_classes)``.

    The first row is skipped as a header. Column 0 of every remaining row is
    taken as the text and column ``label_column`` as the class name; class
    names are mapped to consecutive integer ids in order of first appearance.
    """
    class_ids = {}
    texts = []
    labels = []
    # newline="" is the mode the csv module documents for reader input; the
    # encoding is made explicit instead of depending on the platform default.
    with open(path, newline="", encoding="utf-8") as doc:
        reader = csv.reader(doc)
        next(reader)  # skip the header row
        for row in reader:
            topic = row[label_column]
            # setdefault hands out the next free id the first time a class is seen.
            labels.append(class_ids.setdefault(topic, len(class_ids)))
            texts.append(row[0])
    return texts, labels, len(class_ids)


def compute_task(task):
    """Fine-tune roberta-base for one task over several train sizes and seeds.

    For every train size in ``[200, 300, 400]`` and every seed in
    ``range(11, 16)`` the corpus is split into train/dev/test, a fresh
    classifier is trained with the dev set used for per-epoch evaluation and
    best-checkpoint selection, and top-1 accuracy on the test set is recorded.

    Args:
        task: a key of the module-level ``tasks`` mapping.

    Returns:
        dict mapping each train size to the list of top-1 test accuracies,
        one entry per seed in seed order.

    Raises:
        ValueError: if the corpus contains more classes than the task's
            ``number_of_labels``.
    """
    # Function-scope import (as in the original cell), executed once per call
    # rather than once per seed.
    from transformers import RobertaForSequenceClassification, TrainingArguments, Trainer

    train_sizes = [200, 300, 400]
    max_train_size = 400
    seeds = range(11, 16)
    epochs = 20
    learning_rate = 4e-5
    nclasses = tasks[task]["number_of_labels"]

    # The corpus does not depend on the seed or the train size: read it once.
    texts, labels, n_found = _load_corpus(
        directory + "target_corpus.csv", tasks[task]["label_column"]
    )
    if n_found > nclasses:
        # Label ids run from 0 to n_found - 1, so the head must have that many outputs.
        raise ValueError(
            f"task {task!r}: corpus has {n_found} classes but number_of_labels is {nclasses}"
        )

    # Everything beyond the largest train size is divided between dev and test,
    # the test set taking the extra example when the remainder is odd. For the
    # 4165-row corpus of the recorded run this gives the 1882 / 1883 split that
    # was previously hard-coded.
    held_out = len(texts) - max_train_size
    dev_size = held_out // 2
    test_size = held_out - dev_size

    def model_init():
        return RobertaForSequenceClassification.from_pretrained("roberta-base", num_labels=nclasses)

    results = {}
    for train_size in train_sizes:
        accuracies = []
        for seed in seeds:
            np.random.seed(seed)
            torch.manual_seed(seed)
            random.seed(seed)

            print("# classes", n_found)
            X_train, X_test, y_train, y_test = train_test_split(
                texts, labels, test_size=test_size, random_state=seed
            )
            X_train, X_dev, y_train, y_dev = train_test_split(
                X_train, y_train, test_size=dev_size, random_state=seed
            )
            if train_size < max_train_size:
                # Keep a random subset of exactly train_size examples: the
                # "test" side of this split becomes the new training set.
                _, X_train, _, y_train = train_test_split(
                    X_train, y_train, test_size=train_size, random_state=seed
                )
            print(len(X_train), len(X_dev), len(X_test))
            print("# classes in train", len(set(y_train)))
            print("# classes in dev", len(set(y_dev)))
            print("# classes in test", len(set(y_test)))

            train_encodings = tokenizer(X_train, truncation=True, padding=True, max_length=mlength)
            dev_encodings = tokenizer(X_dev, truncation=True, padding=True, max_length=mlength)
            test_encodings = tokenizer(X_test, truncation=True, padding=True, max_length=mlength)

            train_dataset = PSCDataset(train_encodings, y_train)
            dev_dataset = PSCDataset(dev_encodings, y_dev)
            test_dataset = PSCDataset(test_encodings, y_test)

            # NOTE(review): output_dir is shared by every run, so checkpoint
            # rotation also sees (and deletes) checkpoints left by the previous
            # run, as the recorded log shows -- confirm this is acceptable.
            training_args = TrainingArguments(
                output_dir="./results",          # output directory
                num_train_epochs=epochs,         # total number of training epochs
                per_device_train_batch_size=16,  # batch size per device during training
                per_device_eval_batch_size=64,   # batch size for evaluation
                warmup_steps=0,                  # number of warmup steps for learning rate scheduler
                weight_decay=0.01,               # strength of weight decay
                logging_dir='./logs',            # directory for storing logs
                logging_steps=10,
                learning_rate=learning_rate,
                save_strategy="epoch",
                evaluation_strategy="epoch",
                load_best_model_at_end=True,
                metric_for_best_model="accuracy",
                save_total_limit=2,
                seed=seed,
            )

            trainer = Trainer(
                model_init=model_init,            # builds a fresh model for this run
                args=training_args,               # training arguments, defined above
                train_dataset=train_dataset,      # training dataset
                eval_dataset=dev_dataset,         # evaluation dataset
                compute_metrics=compute_metrics,  # accuracy used for best-model selection
            )

            trainer.train()
            predictions = trainer.predict(test_dataset)

            accuracies.append(top_k_accuracy(1, predictions.predictions, test_dataset.labels))

        results[train_size] = accuracies
    return results

# Run every configured task; outputs maps task name -> result of compute_task
# (a dict of train size -> list of accuracies).
outputs = {}
for task in tasks:
  outputs[task] = compute_task(task)

# Persist the nested dict next to the data.
# NOTE(review): np.save is given a plain dict, which NumPy stores as a pickled
# object array -- reading it back presumably needs
# np.load(..., allow_pickle=True).item(); confirm with the consuming code.
np.save( directory + "figure_1_results.npy", outputs)

Downloading:   0%|          | 0.00/899k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/456k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/1.36M [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/481 [00:00<?, ?B/s]

# classes 42
200 1882 1883
# classes in train 34
# classes in dev 40
# classes in test 39


loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12",
    "13": "LABEL_13",
    "14": "LABEL_14",
    "15": "LABEL_15",
    "16": "LABEL_16",
    "17": "LABEL_17",
    "18": "LABEL_18",
    "19": "LABEL_19",
    "20": "LABEL_20",
    "21": "LABEL_21",
    "22": "LABEL_22",
    "23": "LABEL_23",
    "24": "LABEL_24",
    "25": "LABEL_25",

Downloading:   0%|          | 0.00/501M [00:00<?, ?B/s]

loading weights file pytorch_model.bin from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/pytorch_model.bin
Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.bias', 'lm_head.dense.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'roberta.pooler.dense.weight', 'roberta.pooler.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some 

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6373,3.438698,0.171095
2,3.3908,3.317014,0.171095
3,3.15,3.221827,0.171095
4,2.9537,3.116266,0.193411
5,2.7625,2.936279,0.268863
6,2.4348,2.85551,0.274708
7,1.8929,2.771087,0.289586
8,1.8125,2.705738,0.320935
9,1.4696,2.653631,0.33475
10,1.1494,2.60669,0.357067


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
  


Downloading builder script:   0%|          | 0.00/1.65k [00:00<?, ?B/s]

Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-26] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-52
Configuration saved in ./results/checkpoint-52/config.json
Model weights saved in ./results/checkpoint-52/pytorch_model.bin
Deleting

# classes 42
200 1882 1883
# classes in train 31
# classes in dev 41
# classes in test 40


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.7068,3.351836,0.196068
2,3.2797,3.185449,0.196068
3,3.1876,3.008971,0.259299
4,2.6514,2.89599,0.265675
5,2.5288,2.776418,0.285335
6,2.2344,2.680371,0.328374
7,1.7101,2.655349,0.31509
8,1.4279,2.592257,0.340595
9,1.2477,2.599226,0.337407
10,0.9436,2.568644,0.36238


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-247] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 42
200 1882 1883
# classes in train 32
# classes in dev 41
# classes in test 41


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6114,3.352728,0.195537
2,3.2567,3.201875,0.195537
3,2.9589,3.047744,0.238576
4,2.5974,2.878942,0.293836
5,2.4504,2.856372,0.30712
6,2.1842,2.686482,0.353879
7,1.7203,2.633838,0.35813
8,1.55,2.603144,0.383634
9,1.3295,2.581018,0.384166
10,1.1072,2.571044,0.391073


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-247] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 42
200 1882 1883
# classes in train 30
# classes in dev 39
# classes in test 42


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6656,3.365279,0.18491
2,3.3072,3.252143,0.18491
3,3.1763,3.109071,0.218385
4,2.6172,2.972684,0.273645
5,2.4064,2.880045,0.302869
6,2.2745,2.775948,0.323592
7,1.6322,2.725397,0.347503
8,1.3867,2.689137,0.343783
9,1.3397,2.668491,0.352285
10,0.9201,2.65728,0.362912


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-195] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 42
200 1882 1883
# classes in train 31
# classes in dev 41
# classes in test 39


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6532,3.348582,0.19288
2,3.3776,3.241226,0.19288
3,3.241,3.196209,0.19288
4,3.0458,3.042512,0.257705
5,2.8169,2.890058,0.27949
6,2.473,2.75823,0.30712
7,2.0812,2.704084,0.336876
8,1.7071,2.619623,0.363974
9,1.5695,2.577912,0.375133
10,1.1234,2.528905,0.39373


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-208] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-26] due to args.save_total_limit
***** Running Evaluatio

# classes 42
300 1882 1883
# classes in train 34
# classes in dev 40
# classes in test 39


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6846,3.355794,0.171095
2,3.1723,3.175599,0.171095
3,3.003,3.014982,0.238576
4,2.7269,2.783,0.309245
5,2.2002,2.588919,0.353879
6,1.7074,2.514342,0.373007
7,1.4452,2.454774,0.39745
8,1.0753,2.441601,0.413921
9,0.9107,2.427202,0.419766
10,0.6641,2.426107,0.424017


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-247] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 42
300 1882 1883
# classes in train 36
# classes in dev 41
# classes in test 40


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6653,3.274939,0.196068
2,3.246,3.123399,0.196068
3,2.9957,2.894967,0.246015
4,2.6344,2.730283,0.297024
5,2.0945,2.638974,0.343252
6,1.7375,2.544092,0.376727
7,1.5284,2.482233,0.385228
8,1.0898,2.483757,0.378321
9,0.8721,2.466243,0.392667
10,0.7369,2.48363,0.384166


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-266] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 42
300 1882 1883
# classes in train 32
# classes in dev 41
# classes in test 41


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6835,3.269358,0.195537
2,3.1305,3.176287,0.195537
3,3.0221,2.978158,0.265143
4,2.7146,2.792143,0.301807
5,2.31,2.657253,0.351753
6,2.0148,2.56581,0.359724
7,1.5059,2.527896,0.390542
8,1.2581,2.423936,0.418704
9,1.0778,2.381187,0.439426
10,0.7799,2.3628,0.435175


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-323] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 42
300 1882 1883
# classes in train 33
# classes in dev 39
# classes in test 42


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6219,3.290799,0.18491
2,3.0774,3.151619,0.190223
3,2.852,3.016177,0.227418
4,2.5112,2.914029,0.238045
5,2.1694,2.829404,0.294368
6,1.8065,2.652848,0.342721
7,1.4694,2.601874,0.353348
8,1.1672,2.568219,0.387885
9,0.9242,2.52657,0.400106
10,0.6789,2.516763,0.383103


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-171] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 42
300 1882 1883
# classes in train 34
# classes in dev 41
# classes in test 39


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.6811,3.248961,0.19288
2,3.1566,3.065289,0.239639
3,2.9035,2.81701,0.273114
4,2.4333,2.633851,0.377258
5,1.9643,2.491365,0.398512
6,1.4874,2.476863,0.396918
7,1.2119,2.467585,0.404888
8,0.9238,2.40714,0.42933
9,0.7966,2.459828,0.411265
10,0.512,2.471809,0.410202


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-361] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 42
400 1882 1883
# classes in train 36
# classes in dev 40
# classes in test 39


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.3497,3.290063,0.171095
2,3.0952,3.141652,0.175345
3,2.785,2.828135,0.297556
4,2.2282,2.576829,0.369288
5,1.7215,2.509804,0.34644
6,1.4824,2.340569,0.40542
7,1.2191,2.322978,0.431987
8,0.8017,2.29779,0.436238
9,0.8111,2.339722,0.435175
10,0.5575,2.346094,0.442614


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-152] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 42
400 1882 1883
# classes in train 38
# classes in dev 41
# classes in test 40


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.4204,3.18342,0.196068
2,2.9204,2.900103,0.251328
3,2.6794,2.660297,0.314028
4,2.1373,2.519305,0.366631
5,1.7559,2.443678,0.392136
6,1.3467,2.402054,0.402232
7,1.058,2.353516,0.412859
8,0.7594,2.361482,0.414453
9,0.6295,2.416414,0.400106
10,0.4272,2.414849,0.417109


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-475] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 42
400 1882 1883
# classes in train 33
# classes in dev 41
# classes in test 41


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.3365,3.218424,0.195537
2,3.0397,2.923923,0.259299
3,2.5979,2.688065,0.321467
4,2.1423,2.497275,0.391073
5,2.0213,2.408473,0.407545
6,1.5572,2.386353,0.428799
7,1.3377,2.33274,0.437301
8,1.0325,2.33463,0.442083
9,0.7559,2.257548,0.46068
10,0.6502,2.339005,0.46865


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-375] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 42
400 1882 1883
# classes in train 35
# classes in dev 39
# classes in test 42


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.2777,3.231005,0.18491
2,2.8234,2.971889,0.263018
3,2.5783,2.677901,0.321467
4,1.8154,2.503471,0.37407
5,1.5647,2.431044,0.381509
6,1.2948,2.455089,0.414984
7,0.9401,2.389544,0.421892
8,0.7934,2.350041,0.427205
9,0.5709,2.376637,0.445802
10,0.4413,2.493687,0.428799


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-250] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 42
400 1882 1883
# classes in train 36
# classes in dev 41
# classes in test 39


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "

Epoch,Training Loss,Validation Loss,Accuracy
1,3.5617,3.20693,0.19288
2,3.2317,3.092108,0.247078
3,3.0371,2.848934,0.267269
4,2.5774,2.671996,0.335282
5,2.0151,2.44912,0.396387
6,1.4391,2.352765,0.417641
7,1.2727,2.483296,0.385228
8,0.8801,2.37538,0.421892
9,0.7904,2.356519,0.433581
10,0.5139,2.436685,0.427205


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-225] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 8
200 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0172,1.943102,0.242295
2,1.8826,1.885604,0.242295
3,1.79,1.73394,0.322529
4,1.5014,1.577496,0.448459
5,1.165,1.565355,0.448459
6,0.9639,1.577729,0.484591
7,0.4815,1.640471,0.473433
8,0.3799,1.811237,0.474495
9,0.3185,1.798931,0.510627
10,0.1431,1.968634,0.492561


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-400] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 8
200 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0595,1.926887,0.266738
2,1.9193,1.837176,0.35813
3,1.9031,1.66373,0.41339
4,1.3805,1.495119,0.477152
5,1.0472,1.51947,0.490967
6,0.8101,1.626215,0.485654
7,0.4053,1.560553,0.522848
8,0.2538,1.725679,0.502125
9,0.1432,1.822184,0.517003
10,0.0547,2.102013,0.497875


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-117] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 8
200 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0171,1.894493,0.267269
2,1.9108,1.828404,0.267269
3,1.7552,1.629486,0.416578
4,1.2704,1.513461,0.4644
5,1.0635,1.576056,0.44899
6,0.8966,1.498389,0.512752
7,0.4414,1.558421,0.527099
8,0.3034,1.665541,0.505845
9,0.2146,1.730014,0.525505
10,0.0714,1.781626,0.525505


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-91] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluation

# classes 8
200 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.9959,1.926051,0.255579
2,1.8559,1.864178,0.320404
3,1.906,1.761038,0.300744
4,1.5305,1.564557,0.459617
5,1.1888,1.383003,0.528693
6,0.9595,1.444349,0.528162
7,0.3702,1.553294,0.527099
8,0.2552,1.703556,0.518066
9,0.1915,1.727714,0.534006
10,0.0927,1.895508,0.522317


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-247] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 8
200 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0532,1.956157,0.164187
2,1.9475,1.804451,0.38204
3,1.8281,1.639905,0.403294
4,1.258,1.583122,0.422954
5,1.0945,1.510847,0.475027
6,0.8639,1.478758,0.522317
7,0.4027,1.537051,0.530287
8,0.2775,1.709229,0.51594
9,0.1644,1.780277,0.512752
10,0.085,1.94342,0.516472


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-13
Configuration saved in ./results/checkpoint-13/config.json
Model weights saved in ./results/checkpoint-13/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-117] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-26
Configuration saved in ./results/checkpoint-26/config.json
Model weights saved in ./results/checkpoint-26/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-39
Configuration saved in ./results/checkpoint-39/config.json
Model weights saved in ./results/checkpoint-39/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-13] due to args.save_total_limit
***** Running Evaluatio

# classes 8
300 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0173,1.915356,0.194474
2,1.759,1.718211,0.311902
3,1.5059,1.527857,0.44474
4,1.041,1.442086,0.487779
5,0.7031,1.486028,0.498937
6,0.3889,1.660009,0.517003
7,0.1908,1.871873,0.505313
8,0.1213,2.028041,0.497343
9,0.0392,2.164007,0.510627
10,0.0146,2.360769,0.513815


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-234] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-260] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 8
300 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0354,1.853607,0.2678
2,1.8323,1.622635,0.438895
3,1.4199,1.448552,0.468119
4,0.9962,1.439003,0.537194
5,0.6386,1.468036,0.52763
6,0.4117,1.62478,0.534006
7,0.2526,1.820151,0.499469
8,0.0953,2.046814,0.495749
9,0.0807,2.029547,0.517535
10,0.021,2.318681,0.520191


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-285] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 8
300 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0531,1.880952,0.287991
2,1.7884,1.703997,0.376196
3,1.4527,1.512457,0.486716
4,0.9445,1.56215,0.483528
5,0.5975,1.54122,0.506376
6,0.2764,1.578075,0.528162
7,0.1321,1.807051,0.518066
8,0.0562,2.103063,0.515409
9,0.0564,2.26484,0.526036
10,0.0105,2.567545,0.498937


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-76] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluation

# classes 8
300 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0447,1.925716,0.255579
2,1.8534,1.757751,0.393199
3,1.5167,1.535486,0.44899
4,1.0785,1.43524,0.522317
5,0.6692,1.480019,0.51594
6,0.3206,1.62254,0.534538
7,0.1695,1.808301,0.512752
8,0.0841,1.891993,0.534538
9,0.0543,2.121623,0.532412
10,0.0157,2.242105,0.53135


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-114] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 8
300 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,2.0597,1.883418,0.236982
2,1.8591,1.638963,0.390542
3,1.3817,1.539201,0.461211
4,0.9636,1.459565,0.534006
5,0.5209,1.574273,0.528162
6,0.4128,1.620064,0.534538
7,0.1964,1.737319,0.549947
8,0.0859,2.125861,0.513284
9,0.0431,2.287673,0.517535
10,0.0163,2.31435,0.538789


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-19
Configuration saved in ./results/checkpoint-19/config.json
Model weights saved in ./results/checkpoint-19/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-361] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-38
Configuration saved in ./results/checkpoint-38/config.json
Model weights saved in ./results/checkpoint-38/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-57
Configuration saved in ./results/checkpoint-57/config.json
Model weights saved in ./results/checkpoint-57/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-19] due to args.save_total_limit
***** Running Evaluatio

# classes 8
400 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.9135,1.872633,0.246546
2,1.6885,1.619704,0.414984
3,1.3453,1.47576,0.476089
4,0.9596,1.398114,0.534006
5,0.7259,1.462917,0.543039
6,0.2969,1.567623,0.559511
7,0.2376,1.671318,0.551541
8,0.0921,1.956201,0.538789
9,0.0794,2.213268,0.529756
10,0.0371,2.247084,0.548353


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-133] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-380] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 8
400 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss


Epoch,Training Loss,Validation Loss,Accuracy
1,2.009,1.826857,0.361318
2,1.6701,1.511216,0.466525
3,1.2341,1.488632,0.47237
4,0.9363,1.393727,0.542508
5,0.6236,1.464176,0.5356
6,0.4918,1.601031,0.522317
7,0.2396,1.896017,0.505845
8,0.1405,1.933705,0.535069
9,0.0983,2.063449,0.541977
10,0.0525,2.348956,0.501063


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-150] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 8
400 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.9014,1.867552,0.345909
2,1.6627,1.586032,0.420829
3,1.35,1.525296,0.475558
4,1.1218,1.501122,0.531881
5,0.6085,1.771485,0.458555
6,0.4159,1.555267,0.541445
7,0.2665,1.694039,0.53932
8,0.116,1.934513,0.540914
9,0.0412,2.190274,0.52763
10,0.0351,2.277709,0.538257


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-375] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 8
400 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.9242,1.854954,0.264612
2,1.5914,1.517027,0.47237
3,1.1885,1.435185,0.498406
4,0.8081,1.49396,0.503188
5,0.5741,1.474471,0.548353
6,0.2802,1.729007,0.535069
7,0.2259,1.770037,0.539851
8,0.0716,2.054895,0.55898
9,0.0504,2.278,0.546759
10,0.0193,2.403611,0.548884


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-475] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

# classes 8
400 1882 1883
# classes in train 8
# classes in dev 8
# classes in test 8


PyTorch: setting up devices
The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).
loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--roberta-base/snapshots/ff46155979338ff8063cdad90908b498ab91b181/config.json
Model config RobertaConfig {
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,

Epoch,Training Loss,Validation Loss,Accuracy
1,1.9875,1.928288,0.20085
2,1.6128,1.566792,0.44899
3,1.3248,1.462904,0.498937
4,0.9411,1.459053,0.539851
5,0.6045,1.508209,0.538789
6,0.4423,1.749491,0.520191
7,0.3453,2.000509,0.502657
8,0.1579,2.102963,0.525505
9,0.0371,2.146791,0.554729
10,0.1282,2.391114,0.535069


***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-25
Configuration saved in ./results/checkpoint-25/config.json
Model weights saved in ./results/checkpoint-25/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-200] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-50
Configuration saved in ./results/checkpoint-50/config.json
Model weights saved in ./results/checkpoint-50/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1882
  Batch size = 64
Saving model checkpoint to ./results/checkpoint-75
Configuration saved in ./results/checkpoint-75/config.json
Model weights saved in ./results/checkpoint-75/pytorch_model.bin
Deleting older checkpoint [results/checkpoint-25] due to args.save_total_limit
***** Running Evaluatio

In [None]:
# Summary report: for every task, print one line per training-set size with the
# mean and standard deviation of the values collected for that size.
# NOTE(review): `outputs[task]` is presumably a mapping from training-set size to
# a list of per-run scores filled in by the training loop above -- confirm there.
for task in tasks:
  print(task + "-Topic Classification")
  results = outputs[task]
  for train_size, scores in results.items():
    # np.std is called with its defaults, i.e. the population std (ddof=0).
    mean_score = np.mean(scores)
    std_score = np.std(scores)
    print(train_size, mean_score, std_score)

44-Topic Classification
200 0.3938396176314392 0.014272184414012389
300 0.4302708443972385 0.018305733848378577
400 0.44503451938396166 0.011139764717686148
8-Topic Classification
200 0.5348911311736589 0.018559724542714137
300 0.5472118959107807 0.015179984895792472
400 0.5595326606479023 0.016832743779634632


In [None]:
# Wall-clock duration of the whole notebook, measured from `start`, which is
# recorded in the first code cell right after the imports.
end = time.time()
# Floor-dividing a float by 60 keeps the float type, so this prints e.g. "245.0".
elapsed_minutes = (end - start) // 60
print(f"The program took {elapsed_minutes} minutes in total.")

The program took 245.0 minutes in total.


In [None]:
# Final cell: ask Colab to unassign the runtime backing this notebook.
# NOTE(review): presumably placed here so the GPU session is released as soon as
# the multi-hour run finishes -- confirm. `google.colab` is only importable on
# Colab, so this cell is expected to fail in any other environment.
from google.colab import runtime
runtime.unassign()