# Initiliation

In [1]:
!pip install transformers datasets --quiet

[K     |████████████████████████████████| 3.3 MB 5.3 MB/s 
[K     |████████████████████████████████| 298 kB 36.8 MB/s 
[K     |████████████████████████████████| 596 kB 54.5 MB/s 
[K     |████████████████████████████████| 3.3 MB 68.4 MB/s 
[K     |████████████████████████████████| 895 kB 55.1 MB/s 
[K     |████████████████████████████████| 61 kB 630 kB/s 
[K     |████████████████████████████████| 132 kB 62.4 MB/s 
[K     |████████████████████████████████| 243 kB 53.4 MB/s 
[K     |████████████████████████████████| 1.1 MB 53.2 MB/s 
[K     |████████████████████████████████| 271 kB 74.3 MB/s 
[K     |████████████████████████████████| 192 kB 63.1 MB/s 
[K     |████████████████████████████████| 160 kB 56.0 MB/s 
[?25h

In [2]:
from transformers import TrainingArguments
from transformers import Trainer
from transformers import AutoModelForSequenceClassification
from transformers import AutoTokenizer

from sklearn.model_selection import train_test_split
from sklearn.metrics import precision_recall_fscore_support, accuracy_score, classification_report, confusion_matrix
from datasets import Dataset
from datasets import load_metric

import numpy as np
import math
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

from google.colab import drive

# Data Preparation

In [3]:
drive.mount('/content/drive/')

Mounted at /content/drive/


In [4]:
%cd 'drive/MyDrive/Masterarbeit/Colab Notebooks/OVERVIEW MBTI/Datasets/URL_Balanced_MASK'

/content/drive/.shortcut-targets-by-id/1aHXlqhpj1STohhfU4gn53D4whaLH__Jz/Masterarbeit/Colab Notebooks/OVERVIEW MBTI/Datasets/URL_Balanced_MASK


In [5]:
dfNS = pd.read_csv('MBTI_NS_URL_Balanced_MASK.csv', sep=",", error_bad_lines=False)
dfNS

Unnamed: 0,text,label
0,i like that you are kind as [MASK] i find that...,0
1,oh my you are right who really talks like tha...,0
2,yep yep yep especially the last one yep agree ...,0
3,things that are generalizable to the entire po...,0
4,work student hobbies studying gaming reading d...,0
...,...,...
1947,favorites one flew over the cuckoos nest1984 a...,1
1948,could i have my name changed to barkhouse than...,1
1949,i hate small talk just get to the point if its...,1
1950,when some days you talk with every people you ...,1


# Model Training

In [6]:
modeltype = "roberta-base"

In [7]:
train, test = train_test_split(dfNS, test_size=0.2, random_state=0, stratify=dfNS.label)

train = Dataset.from_pandas(train)
test = Dataset.from_pandas(test)

tokenizer = AutoTokenizer.from_pretrained(modeltype)

def tokenize_function(examples):
    return tokenizer(examples["text"], padding="max_length", truncation=True)

tokenized_train = train.map(tokenize_function, batched=True)
tokenized_test = test.map(tokenize_function, batched=True)

full_train_dataset = tokenized_train
full_eval_dataset = tokenized_test

model = AutoModelForSequenceClassification.from_pretrained(modeltype, num_labels=2)

training_args = TrainingArguments(
    "RoBERTa_NS_MASK", 
    evaluation_strategy="epoch",
    save_strategy = 'no',
    save_steps = 100000,
    save_total_limit = 1,
    metric_for_best_model="eval_f1")

def compute_metrics(pred):
    labels = pred.label_ids
    preds = pred.predictions.argmax(-1)
    precision, recall, f1, _ = precision_recall_fscore_support(labels, preds, average='macro')
    acc = accuracy_score(labels, preds)
    print(classification_report(labels, preds, labels=[0,1]))
    print(confusion_matrix(labels,preds))
    return {
        'accuracy': acc,
        'f1': f1,
        'precision': precision,
        'recall': recall
    }

Downloading:   0%|          | 0.00/481 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/878k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/446k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/1.29M [00:00<?, ?B/s]

  0%|          | 0/2 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

Downloading:   0%|          | 0.00/478M [00:00<?, ?B/s]

Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'roberta.pooler.dense.bias', 'lm_head.dense.bias', 'roberta.pooler.dense.weight', 'lm_head.layer_norm.bias', 'lm_head.dense.weight', 'lm_head.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.bias', 'classifier.

# Hyperparameter Optimization

In [8]:
! pip install optuna --quiet

[K     |████████████████████████████████| 308 kB 5.2 MB/s 
[K     |████████████████████████████████| 80 kB 11.3 MB/s 
[K     |████████████████████████████████| 209 kB 65.3 MB/s 
[K     |████████████████████████████████| 75 kB 5.5 MB/s 
[K     |████████████████████████████████| 49 kB 8.3 MB/s 
[K     |████████████████████████████████| 149 kB 72.3 MB/s 
[K     |████████████████████████████████| 112 kB 75.7 MB/s 
[?25h  Building wheel for pyperclip (setup.py) ... [?25l[?25hdone


In [9]:
def model_init():
    return AutoModelForSequenceClassification.from_pretrained(modeltype, num_labels=2)

In [10]:
trainer = Trainer(
      model_init=model_init,
      args=training_args, 
      train_dataset=full_train_dataset, 
      eval_dataset=full_eval_dataset,
      compute_metrics=compute_metrics 
  )

loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta-base/r

In [11]:
import sklearn.metrics as metrics
import optuna
import sys
import logging

def objective (metrics):
  return metrics['eval_f1']

def hyperparameter_space(trial):

    return {
        "learning_rate": trial.suggest_float("learning_rate", 5e-8, 5e-1, log=True),
        "per_device_train_batch_size": trial.suggest_categorical("per_device_train_batch_size", [2, 4, 8, 16]),
        "weight_decay": trial.suggest_float("weight_decay", 5e-12, 5e-1, log=True),
        "num_train_epochs": trial.suggest_float("num_train_epochs",1,8,log=True),
        #"adam_epsilon": trial.suggest_float("adam_epsilon", 1e-10, 1e-6, log=True),
        #"seed" : trial.suggest_float("seed",10,60,log=True)
        }

optuna.logging.get_logger("optuna").addHandler(logging.StreamHandler(sys.stdout))
study_name = "RoBERTa_MASK_NS"  # Unique identifier of the study.
storage_name = "sqlite:///{}.db".format(study_name)

best_run = trainer.hyperparameter_search(hp_space=hyperparameter_space,compute_objective=objective, n_trials=50, direction="maximize",study_name=study_name, storage=storage_name )

study = optuna.create_study()

[32m[I 2021-12-12 17:02:21,689][0m A new study created in RDB with name: RoBERTa_MASK_NS[0m


A new study created in RDB with name: RoBERTa_MASK_NS


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6996,0.693003,0.511509,0.338409,0.255754,0.5
2,0.6943,0.701743,0.511509,0.338409,0.255754,0.5
3,0.7028,0.69361,0.488491,0.328179,0.244246,0.5
4,0.6979,0.693073,0.511509,0.338409,0.255754,0.5
5,0.6969,0.693119,0.511509,0.338409,0.255754,0.5
6,0.6963,0.693242,0.488491,0.328179,0.244246,0.5
7,0.6928,0.692922,0.511509,0.338409,0.255754,0.5
7,0.6927,0.692914,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 17:18:53,141][0m Trial 0 finished with value: 0.3384094754653131 and parameters: {'learning_rate': 1.0696002857866855e-05, 'per_device_train_batch_size': 2, 'weight_decay': 8.320150727863287e-08, 'num_train_epochs': 7.722647604976535}. Best is trial 0 with value: 0.338409475465

Trial 0 finished with value: 0.3384094754653131 and parameters: {'learning_rate': 1.0696002857866855e-05, 'per_device_train_batch_size': 2, 'weight_decay': 8.320150727863287e-08, 'num_train_epochs': 7.722647604976535}. Best is trial 0 with value: 0.3384094754653131.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,63.963413,0.488491,0.328179,0.244246,0.5
2,38.979600,23.543633,0.488491,0.328179,0.244246,0.5
3,27.888500,34.840885,0.511509,0.338409,0.255754,0.5
4,19.730000,3.168558,0.488491,0.328179,0.244246,0.5
5,19.730000,9.346238,0.511509,0.338409,0.255754,0.5
5,10.670900,1.094561,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 17:29:16,156][0m Trial 1 finished with value: 0.3384094754653131 and parameters: {'learning_rate': 0.4221776849260434, 'per_device_train_batch_size': 4, 'weight_decay': 0.041326081068267045, 'num_train_epochs': 5.688070851486295}. Best is trial 0 with value: 0.3384094754653131.

Trial 1 finished with value: 0.3384094754653131 and parameters: {'learning_rate': 0.4221776849260434, 'per_device_train_batch_size': 4, 'weight_decay': 0.041326081068267045, 'num_train_epochs': 5.688070851486295}. Best is trial 0 with value: 0.3384094754653131.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.69287,0.491049,0.333719,0.744872,0.5025
2,No log,0.689997,0.514066,0.348745,0.589777,0.502736
2,0.692100,0.689222,0.531969,0.440629,0.559797,0.522945


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.01      0.01       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.74      0.50      0.33       391
weighted avg       0.75      0.49      0.33       391

[[  1 199]
 [  0 191]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.99      0.68       200
           1       0.67      0.01      0.02       191

    accuracy                           0.51       391
   macro avg       0.59      0.50      0.35       391
weighted avg       0.59      0.51      0.36       391

[[199   1]
 [189   2]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.92      0.67       200
           1       0.60      0.13      0.21       191

    accuracy                           0.53       391
   macro avg       0.56      0.52      0.44       391
weighted avg       0.56      0.53      0.45       391

[[183  17]
 [166  25]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 17:33:52,484][0m Trial 2 finished with value: 0.4406294706723891 and parameters: {'learning_rate': 2.4400310752316386e-06, 'per_device_train_batch_size': 8, 'weight_decay': 5.252611964132717e-07, 'num_train_epochs': 2.7442387285254384}. Best is trial 2 with value: 0.4406294706723891.[0m


Trial 2 finished with value: 0.4406294706723891 and parameters: {'learning_rate': 2.4400310752316386e-06, 'per_device_train_batch_size': 8, 'weight_decay': 5.252611964132717e-07, 'num_train_epochs': 2.7442387285254384}. Best is trial 2 with value: 0.4406294706723891.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.690054,0.493606,0.377268,0.517985,0.503822
2,No log,0.692057,0.598465,0.579037,0.612367,0.593835
2,No log,0.646226,0.634271,0.634118,0.634108,0.634136


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.55      0.06      0.11       200
           1       0.49      0.95      0.65       191

    accuracy                           0.49       391
   macro avg       0.52      0.50      0.38       391
weighted avg       0.52      0.49      0.37       391

[[ 12 188]
 [ 10 181]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.58      0.80      0.67       200
           1       0.65      0.39      0.49       191

    accuracy                           0.60       391
   macro avg       0.61      0.59      0.58       391
weighted avg       0.61      0.60      0.58       391

[[159  41]
 [116  75]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.64      0.64       200
           1       0.62      0.63      0.63       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[128  72]
 [ 71 120]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 17:38:32,834][0m Trial 3 finished with value: 0.6341179319054817 and parameters: {'learning_rate': 1.0813915071256551e-05, 'per_device_train_batch_size': 16, 'weight_decay': 3.5099819965382977e-09, 'num_train_epochs': 2.981915880251583}. Best is trial 3 with value: 0.6341179319054817.[0m


Trial 3 finished with value: 0.6341179319054817 and parameters: {'learning_rate': 1.0813915071256551e-05, 'per_device_train_batch_size': 16, 'weight_decay': 3.5099819965382977e-09, 'num_train_epochs': 2.981915880251583}. Best is trial 3 with value: 0.6341179319054817.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.690643,0.554987,0.524504,0.584866,0.561113
2,0.692400,0.683923,0.526854,0.376514,0.697291,0.515825
2,0.672000,0.667631,0.616368,0.616366,0.616784,0.616754


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.29      0.40       200
           1       0.53      0.83      0.64       191

    accuracy                           0.55       391
   macro avg       0.58      0.56      0.52       391
weighted avg       0.59      0.55      0.52       391

[[ 59 141]
 [ 33 158]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.99      0.68       200
           1       0.88      0.04      0.07       191

    accuracy                           0.53       391
   macro avg       0.70      0.52      0.38       391
weighted avg       0.69      0.53      0.38       391

[[199   1]
 [184   7]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.60      0.62       200
           1       0.60      0.63      0.62       191

    accuracy                           0.62       391
   macro avg       0.62      0.62      0.62       391
weighted avg       0.62      0.62      0.62       391

[[120  80]
 [ 70 121]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 17:43:17,950][0m Trial 4 finished with value: 0.6163657770800628 and parameters: {'learning_rate': 2.1074410097143765e-06, 'per_device_train_batch_size': 4, 'weight_decay': 4.113693549617035e-11, 'num_train_epochs': 2.571573491376362}. Best is trial 3 with value: 0.6341179319054817.[0m


Trial 4 finished with value: 0.6163657770800628 and parameters: {'learning_rate': 2.1074410097143765e-06, 'per_device_train_batch_size': 4, 'weight_decay': 4.113693549617035e-11, 'num_train_epochs': 2.571573491376362}. Best is trial 3 with value: 0.6341179319054817.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.693982,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 17:44:53,009][0m Trial 5 pruned. [0m


Trial 5 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,2.316601,0.511509,0.338409,0.255754,0.5
2,No log,0.705415,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 17:48:13,852][0m Trial 6 pruned. [0m


Trial 6 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.7193,0.693007,0.511509,0.338409,0.255754,0.5
1,0.6999,0.6929,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 17:51:15,538][0m Trial 7 pruned. [0m


Trial 7 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.673365,0.608696,0.60844,0.610155,0.609607
2,No log,0.661759,0.613811,0.604498,0.620233,0.610602
3,No log,0.665142,0.634271,0.632105,0.635068,0.63284
3,No log,0.71452,0.634271,0.625451,0.642487,0.631073


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.57      0.60       200
           1       0.59      0.65      0.62       191

    accuracy                           0.61       391
   macro avg       0.61      0.61      0.61       391
weighted avg       0.61      0.61      0.61       391

[[114  86]
 [ 67 124]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.60      0.75      0.67       200
           1       0.64      0.47      0.54       191

    accuracy                           0.61       391
   macro avg       0.62      0.61      0.60       391
weighted avg       0.62      0.61      0.61       391

[[150  50]
 [101  90]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.69      0.66       200
           1       0.64      0.57      0.60       191

    accuracy                           0.63       391
   macro avg       0.64      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[139  61]
 [ 82 109]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.77      0.68       200
           1       0.67      0.49      0.57       191

    accuracy                           0.63       391
   macro avg       0.64      0.63      0.63       391
weighted avg       0.64      0.63      0.63       391

[[154  46]
 [ 97  94]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 17:56:35,168][0m Trial 8 finished with value: 0.6254513300420013 and parameters: {'learning_rate': 3.01722160191678e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0034806136879271246, 'num_train_epochs': 3.355906718431561}. Best is trial 3 with value: 0.6341179319054817.[0m


Trial 8 finished with value: 0.6254513300420013 and parameters: {'learning_rate': 3.01722160191678e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0034806136879271246, 'num_train_epochs': 3.355906718431561}. Best is trial 3 with value: 0.6341179319054817.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.693878,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 17:58:16,453][0m Trial 9 pruned. [0m


Trial 9 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.698762,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 17:59:51,470][0m Trial 10 pruned. [0m


Trial 10 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.694234,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:01:26,509][0m Trial 11 pruned. [0m


Trial 11 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.698773,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:03:01,806][0m Trial 12 pruned. [0m


Trial 12 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.682153,0.560102,0.472947,0.635854,0.551034
2,No log,0.65905,0.624041,0.621176,0.625154,0.622369
3,No log,0.646753,0.649616,0.646275,0.652111,0.647723
3,No log,0.705227,0.639386,0.636639,0.640857,0.637723


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.54      0.94      0.69       200
           1       0.73      0.16      0.26       191

    accuracy                           0.56       391
   macro avg       0.64      0.55      0.47       391
weighted avg       0.63      0.56      0.48       391

[[189  11]
 [161  30]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.69      0.65       200
           1       0.63      0.55      0.59       191

    accuracy                           0.62       391
   macro avg       0.63      0.62      0.62       391
weighted avg       0.62      0.62      0.62       391

[[139  61]
 [ 86 105]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.73      0.68       200
           1       0.67      0.57      0.61       191

    accuracy                           0.65       391
   macro avg       0.65      0.65      0.65       391
weighted avg       0.65      0.65      0.65       391

[[146  54]
 [ 83 108]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.71      0.67       200
           1       0.65      0.57      0.61       191

    accuracy                           0.64       391
   macro avg       0.64      0.64      0.64       391
weighted avg       0.64      0.64      0.64       391

[[142  58]
 [ 83 108]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 18:09:14,828][0m Trial 13 finished with value: 0.6366386554621848 and parameters: {'learning_rate': 2.9136645854693335e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.0946416634758784e-08, 'num_train_epochs': 3.9728281289117455}. Best is trial 13 with value: 0.6366386554621848.[0m


Trial 13 finished with value: 0.6366386554621848 and parameters: {'learning_rate': 2.9136645854693335e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.0946416634758784e-08, 'num_train_epochs': 3.9728281289117455}. Best is trial 13 with value: 0.6366386554621848.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.829817,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:10:50,038][0m Trial 14 pruned. [0m


Trial 14 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.695934,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:12:25,129][0m Trial 15 pruned. [0m


Trial 15 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,2.99491,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:14:00,301][0m Trial 16 pruned. [0m


Trial 16 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.69364,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:15:51,132][0m Trial 17 pruned. [0m


Trial 17 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6999,0.702908,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:18:01,381][0m Trial 18 pruned. [0m


Trial 18 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692894,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:19:36,550][0m Trial 19 pruned. [0m


Trial 19 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.696312,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:21:11,718][0m Trial 20 pruned. [0m


Trial 20 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692661,0.575448,0.566229,0.57798,0.572395
2,No log,0.700582,0.511509,0.338409,0.255754,0.5
3,No log,0.69254,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.57      0.70      0.63       200
           1       0.59      0.44      0.50       191

    accuracy                           0.58       391
   macro avg       0.58      0.57      0.57       391
weighted avg       0.58      0.58      0.57       391

[[141  59]
 [107  84]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:25:52,717][0m Trial 21 pruned. [0m


Trial 21 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.675485,0.629156,0.629069,0.63015,0.629843
2,No log,0.667878,0.613811,0.600256,0.624703,0.609895
3,No log,0.648524,0.629156,0.626331,0.630388,0.627487
3,No log,0.648824,0.629156,0.626331,0.630388,0.627487


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.65      0.60      0.62       200
           1       0.61      0.66      0.63       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[120  80]
 [ 65 126]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.59      0.78      0.67       200
           1       0.66      0.44      0.53       191

    accuracy                           0.61       391
   macro avg       0.62      0.61      0.60       391
weighted avg       0.62      0.61      0.60       391

[[156  44]
 [107  84]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.70      0.66       200
           1       0.64      0.55      0.59       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[140  60]
 [ 85 106]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.70      0.66       200
           1       0.64      0.55      0.59       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[140  60]
 [ 85 106]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 18:30:49,421][0m Trial 22 finished with value: 0.6263305322128851 and parameters: {'learning_rate': 1.3558861400977725e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0016058525778814324, 'num_train_epochs': 3.087744367688028}. Best is trial 13 with value: 0.6366386554621848.[0m


Trial 22 finished with value: 0.6263305322128851 and parameters: {'learning_rate': 1.3558861400977725e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0016058525778814324, 'num_train_epochs': 3.087744367688028}. Best is trial 13 with value: 0.6366386554621848.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.691873,0.480818,0.324698,0.242268,0.492147


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.48      0.98      0.65       191

    accuracy                           0.48       391
   macro avg       0.24      0.49      0.32       391
weighted avg       0.24      0.48      0.32       391

[[  0 200]
 [  3 188]]


[32m[I 2021-12-12 18:32:24,924][0m Trial 23 pruned. [0m


Trial 23 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.69352,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:33:59,807][0m Trial 24 pruned. [0m


Trial 24 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.695985,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:35:34,801][0m Trial 25 pruned. [0m


Trial 25 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692647,0.488491,0.332537,0.494216,0.499882


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.01      0.01       200
           1       0.49      0.99      0.66       191

    accuracy                           0.49       391
   macro avg       0.49      0.50      0.33       391
weighted avg       0.49      0.49      0.33       391

[[  1 199]
 [  1 190]]


[32m[I 2021-12-12 18:37:16,087][0m Trial 26 pruned. [0m


Trial 26 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692931,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:39:06,004][0m Trial 27 pruned. [0m


Trial 27 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.659404,0.608696,0.608532,0.609881,0.60949
2,No log,0.658282,0.608696,0.606378,0.60905,0.607251
2,No log,0.6682,0.611253,0.603406,0.616022,0.608338


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.57      0.60       200
           1       0.59      0.64      0.62       191

    accuracy                           0.61       391
   macro avg       0.61      0.61      0.61       391
weighted avg       0.61      0.61      0.61       391

[[115  85]
 [ 68 123]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.67      0.64       200
           1       0.61      0.54      0.58       191

    accuracy                           0.61       391
   macro avg       0.61      0.61      0.61       391
weighted avg       0.61      0.61      0.61       391

[[134  66]
 [ 87 104]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.60      0.73      0.66       200
           1       0.63      0.48      0.55       191

    accuracy                           0.61       391
   macro avg       0.62      0.61      0.60       391
weighted avg       0.62      0.61      0.60       391

[[147  53]
 [ 99  92]]


[32m[I 2021-12-12 18:43:40,944][0m Trial 28 pruned. [0m


Trial 28 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6947,0.691884,0.557545,0.550189,0.565872,0.560785
2,0.6898,0.691405,0.519182,0.368488,0.591187,0.508207
3,0.684,0.67321,0.601023,0.595174,0.611814,0.60411


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.60      0.42      0.49       200
           1       0.54      0.70      0.61       191

    accuracy                           0.56       391
   macro avg       0.57      0.56      0.55       391
weighted avg       0.57      0.56      0.55       391

[[ 84 116]
 [ 57 134]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.98      0.68       200
           1       0.67      0.03      0.06       191

    accuracy                           0.52       391
   macro avg       0.59      0.51      0.37       391
weighted avg       0.59      0.52      0.38       391

[[197   3]
 [185   6]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.65      0.47      0.55       200
           1       0.57      0.74      0.64       191

    accuracy                           0.60       391
   macro avg       0.61      0.60      0.60       391
weighted avg       0.61      0.60      0.59       391

[[ 94 106]
 [ 50 141]]


[32m[I 2021-12-12 18:50:04,350][0m Trial 29 pruned. [0m


Trial 29 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,1.1176,1.248005,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 18:52:13,577][0m Trial 30 pruned. [0m


Trial 30 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.658447,0.613811,0.61235,0.613795,0.612723
2,No log,0.648751,0.629156,0.629146,0.629324,0.629372
3,No log,0.672306,0.639386,0.633868,0.643952,0.636898
3,No log,0.691414,0.636829,0.633179,0.63913,0.634869


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.66      0.64       200
           1       0.61      0.57      0.59       191

    accuracy                           0.61       391
   macro avg       0.61      0.61      0.61       391
weighted avg       0.61      0.61      0.61       391

[[132  68]
 [ 83 108]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.62      0.63       200
           1       0.62      0.64      0.63       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[124  76]
 [ 69 122]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.74      0.68       200
           1       0.66      0.53      0.59       191

    accuracy                           0.64       391
   macro avg       0.64      0.64      0.63       391
weighted avg       0.64      0.64      0.63       391

[[149  51]
 [ 90 101]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.72      0.67       200
           1       0.65      0.55      0.60       191

    accuracy                           0.64       391
   macro avg       0.64      0.63      0.63       391
weighted avg       0.64      0.64      0.63       391

[[144  56]
 [ 86 105]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 18:57:32,256][0m Trial 31 finished with value: 0.633179175475687 and parameters: {'learning_rate': 2.482091827924726e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0024601092568661046, 'num_train_epochs': 3.34403559358756}. Best is trial 13 with value: 0.6366386554621848.[0m


Trial 31 finished with value: 0.633179175475687 and parameters: {'learning_rate': 2.482091827924726e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0024601092568661046, 'num_train_epochs': 3.34403559358756}. Best is trial 13 with value: 0.6366386554621848.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.687446,0.57289,0.554229,0.595753,0.577906
2,No log,0.668458,0.634271,0.62958,0.637561,0.632016
3,No log,0.645724,0.624041,0.620456,0.625761,0.622134
4,No log,0.659245,0.636829,0.624445,0.650305,0.632984
4,No log,0.668237,0.629156,0.62696,0.629864,0.627723


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.65      0.36      0.46       200
           1       0.54      0.80      0.65       191

    accuracy                           0.57       391
   macro avg       0.60      0.58      0.55       391
weighted avg       0.60      0.57      0.55       391

[[ 72 128]
 [ 39 152]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.73      0.67       200
           1       0.65      0.53      0.59       191

    accuracy                           0.63       391
   macro avg       0.64      0.63      0.63       391
weighted avg       0.64      0.63      0.63       391

[[146  54]
 [ 89 102]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.70      0.66       200
           1       0.64      0.54      0.58       191

    accuracy                           0.62       391
   macro avg       0.63      0.62      0.62       391
weighted avg       0.63      0.62      0.62       391

[[141  59]
 [ 88 103]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.80      0.69       200
           1       0.69      0.47      0.56       191

    accuracy                           0.64       391
   macro avg       0.65      0.63      0.62       391
weighted avg       0.65      0.64      0.63       391

[[160  40]
 [102  89]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.69      0.66       200
           1       0.64      0.57      0.60       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[138  62]
 [ 83 108]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 19:04:49,480][0m Trial 32 finished with value: 0.6269599489409861 and parameters: {'learning_rate': 1.0895430041659685e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0030793307766418536, 'num_train_epochs': 4.635265632779619}. Best is trial 13 with value: 0.6366386554621848.[0m


Trial 32 finished with value: 0.6269599489409861 and parameters: {'learning_rate': 1.0895430041659685e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0030793307766418536, 'num_train_epochs': 4.635265632779619}. Best is trial 13 with value: 0.6366386554621848.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692909,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:06:24,626][0m Trial 33 pruned. [0m


Trial 33 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.678106,0.626598,0.620136,0.631288,0.623927


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.74      0.67       200
           1       0.65      0.51      0.57       191

    accuracy                           0.63       391
   macro avg       0.63      0.62      0.62       391
weighted avg       0.63      0.63      0.62       391

[[148  52]
 [ 94  97]]


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.678106,0.626598,0.620136,0.631288,0.623927
2,0.687500,0.666478,0.626598,0.618491,0.644521,0.630288
3,0.643000,0.628921,0.621483,0.614398,0.626408,0.618691


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.70      0.47      0.56       200
           1       0.59      0.79      0.67       191

    accuracy                           0.63       391
   macro avg       0.64      0.63      0.62       391
weighted avg       0.65      0.63      0.62       391

[[ 94 106]
 [ 40 151]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.74      0.67       200
           1       0.65      0.50      0.56       191

    accuracy                           0.62       391
   macro avg       0.63      0.62      0.61       391
weighted avg       0.63      0.62      0.62       391

[[148  52]
 [ 96  95]]


[32m[I 2021-12-12 19:11:51,229][0m Trial 34 pruned. [0m


Trial 34 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.693972,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:13:26,341][0m Trial 35 pruned. [0m


Trial 35 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692905,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:15:07,829][0m Trial 36 pruned. [0m


Trial 36 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.697718,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:16:42,876][0m Trial 37 pruned. [0m


Trial 37 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.660606,0.611253,0.610129,0.611073,0.61034
2,No log,0.662962,0.636829,0.636807,0.637472,0.637343
3,No log,0.651779,0.631714,0.629949,0.632139,0.630458
4,No log,0.749231,0.618926,0.618886,0.619652,0.61949
5,No log,0.80915,0.629156,0.6244,0.632229,0.626898
5,0.541900,0.835212,0.618926,0.605551,0.63051,0.615013


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.65      0.63       200
           1       0.61      0.57      0.59       191

    accuracy                           0.61       391
   macro avg       0.61      0.61      0.61       391
weighted avg       0.61      0.61      0.61       391

[[130  70]
 [ 82 109]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.65      0.61      0.63       200
           1       0.62      0.66      0.64       191

    accuracy                           0.64       391
   macro avg       0.64      0.64      0.64       391
weighted avg       0.64      0.64      0.64       391

[[123  77]
 [ 65 126]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.69      0.66       200
           1       0.64      0.58      0.60       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.63       391
weighted avg       0.63      0.63      0.63       391

[[137  63]
 [ 81 110]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.59      0.61       200
           1       0.60      0.64      0.62       191

    accuracy                           0.62       391
   macro avg       0.62      0.62      0.62       391
weighted avg       0.62      0.62      0.62       391

[[119  81]
 [ 68 123]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.72      0.67       200
           1       0.65      0.53      0.58       191

    accuracy                           0.63       391
   macro avg       0.63      0.63      0.62       391
weighted avg       0.63      0.63      0.63       391

[[145  55]
 [ 90 101]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.60      0.79      0.68       200
           1       0.66      0.45      0.53       191

    accuracy                           0.62       391
   macro avg       0.63      0.62      0.61       391
weighted avg       0.63      0.62      0.61       391

[[157  43]
 [106  85]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-12 19:25:11,504][0m Trial 38 finished with value: 0.6055505528209781 and parameters: {'learning_rate': 1.7126909465601443e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.7275485042756645e-06, 'num_train_epochs': 5.38631612164996}. Best is trial 13 with value: 0.6366386554621848.[0m


Trial 38 finished with value: 0.6055505528209781 and parameters: {'learning_rate': 1.7126909465601443e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.7275485042756645e-06, 'num_train_epochs': 5.38631612164996}. Best is trial 13 with value: 0.6366386554621848.


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,135.295609,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:27:01,641][0m Trial 39 pruned. [0m


Trial 39 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.69326,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:28:43,135][0m Trial 40 pruned. [0m


Trial 40 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692863,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:30:18,189][0m Trial 41 pruned. [0m


Trial 41 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.685204,0.621483,0.620388,0.625113,0.62305
2,No log,0.6713,0.613811,0.601023,0.623858,0.610013
2,No log,0.644448,0.616368,0.612902,0.617708,0.614516


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.65      0.56      0.60       200
           1       0.60      0.69      0.64       191

    accuracy                           0.62       391
   macro avg       0.63      0.62      0.62       391
weighted avg       0.63      0.62      0.62       391

[[111  89]
 [ 59 132]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.59      0.78      0.67       200
           1       0.65      0.45      0.53       191

    accuracy                           0.61       391
   macro avg       0.62      0.61      0.60       391
weighted avg       0.62      0.61      0.60       391

[[155  45]
 [106  85]]


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.69      0.65       200
           1       0.63      0.53      0.58       191

    accuracy                           0.62       391
   macro avg       0.62      0.61      0.61       391
weighted avg       0.62      0.62      0.61       391

[[139  61]
 [ 89 102]]


[32m[I 2021-12-12 19:34:36,504][0m Trial 42 pruned. [0m


Trial 42 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.693967,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:36:11,581][0m Trial 43 pruned. [0m


Trial 43 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.709101,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:37:46,710][0m Trial 44 pruned. [0m


Trial 44 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.693007,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:39:21,678][0m Trial 45 pruned. [0m


Trial 45 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.694079,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:40:56,854][0m Trial 46 pruned. [0m


Trial 46 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.7095,0.692908,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:43:06,194][0m Trial 47 pruned. [0m


Trial 47 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.692911,0.511509,0.338409,0.255754,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      1.00      0.68       200
           1       0.00      0.00      0.00       191

    accuracy                           0.51       391
   macro avg       0.26      0.50      0.34       391
weighted avg       0.26      0.51      0.35       391

[[200   0]
 [191   0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:44:41,417][0m Trial 48 pruned. [0m


Trial 48 pruned. 


Trial:
loading configuration file https://huggingface.co/roberta-base/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/733bade19e5f0ce98e6531021dd5180994bb2f7b8bd7e80c7968805834ba351e.35205c6cfc956461d8515139f0f8dd5d207a2f336c0c3a83b4bc8dca3518e37b
Model config RobertaConfig {
  "_name_or_path": "roberta-base",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "transformers_version": "4.13.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}

loading weights file https://huggingface.co/roberta

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.693635,0.488491,0.328179,0.244246,0.5


The following columns in the evaluation set  don't have a corresponding argument in `RobertaForSequenceClassification.forward` and have been ignored: __index_level_0__, text.
***** Running Evaluation *****
  Num examples = 391
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       200
           1       0.49      1.00      0.66       191

    accuracy                           0.49       391
   macro avg       0.24      0.50      0.33       391
weighted avg       0.24      0.49      0.32       391

[[  0 200]
 [  0 191]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-12 19:46:16,604][0m Trial 49 pruned. [0m


Trial 49 pruned. 


[32m[I 2021-12-12 19:46:16,642][0m A new study created in memory with name: no-name-39219a64-861d-4682-a20e-1ba445b59167[0m


A new study created in memory with name: no-name-39219a64-861d-4682-a20e-1ba445b59167


In [12]:
storage_name

'sqlite:///RoBERTa_MASK_NS.db'

In [13]:
study_name

'RoBERTa_MASK_NS'

In [14]:
study = optuna.create_study(study_name=study_name, storage=storage_name, load_if_exists=True, direction="maximize")
df = study.trials_dataframe(attrs=("number", "value", "params", "state"))

[32m[I 2021-12-12 19:46:16,753][0m Using an existing study with name 'RoBERTa_MASK_NS' instead of creating a new one.[0m


Using an existing study with name 'RoBERTa_MASK_NS' instead of creating a new one.


In [15]:
df

Unnamed: 0,number,value,params_learning_rate,params_num_train_epochs,params_per_device_train_batch_size,params_weight_decay,state
0,0,0.338409,1.0696e-05,7.722648,2,8.320151e-08,COMPLETE
1,1,0.338409,0.4221777,5.688071,4,0.04132608,COMPLETE
2,2,0.440629,2.440031e-06,2.744239,8,5.252612e-07,COMPLETE
3,3,0.634118,1.081392e-05,2.981916,16,3.509982e-09,COMPLETE
4,4,0.616366,2.107441e-06,2.571573,4,4.113694e-11,COMPLETE
5,5,0.328179,2.30841e-06,4.656619,16,4.119576e-11,PRUNED
6,6,0.328179,0.005303481,7.334966,8,0.1188048,PRUNED
7,7,0.338409,8.714368e-05,1.361011,2,0.0002285913,PRUNED
8,8,0.625451,3.017222e-05,3.355907,16,0.003480614,COMPLETE
9,9,0.338409,0.0003571422,1.17325,8,1.629541e-11,PRUNED


In [16]:
fig = optuna.visualization.plot_param_importances(study)
fig.show()

In [17]:
best_run

BestRun(run_id='13', objective=0.6366386554621848, hyperparameters={'learning_rate': 2.9136645854693335e-05, 'num_train_epochs': 3.9728281289117455, 'per_device_train_batch_size': 16, 'weight_decay': 1.0946416634758784e-08})

In [18]:
optuna.visualization.plot_intermediate_values(study)

In [19]:
optuna.visualization.plot_parallel_coordinate(study)

In [20]:
optuna.visualization.plot_optimization_history(study)

In [21]:
optuna.visualization.plot_contour(study)

In [22]:
optuna.visualization.plot_slice(study)

In [23]:
optuna.visualization.plot_edf(study)