# Initialization

In [None]:
!pip install transformers datasets --quiet

In [None]:
from transformers import TrainingArguments
from transformers import Trainer
from transformers import AutoModelForSequenceClassification
from transformers import AutoTokenizer

from sklearn.model_selection import train_test_split
from sklearn.metrics import precision_recall_fscore_support, accuracy_score, classification_report, confusion_matrix
from datasets import Dataset
from datasets import load_metric

import numpy as np
import math
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

from google.colab import drive

# Data Preparation

In [None]:
# Mount Google Drive at /content/drive/ so the dataset folder used below is reachable.
drive.mount('/content/drive/')

Mounted at /content/drive/


In [None]:
%cd 'drive/MyDrive/Masterarbeit/Colab Notebooks/OVERVIEW myPers/00_Datasets/Baseline'

/content/drive/.shortcut-targets-by-id/1aHXlqhpj1STohhfU4gn53D4whaLH__Jz/Masterarbeit/Colab Notebooks/OVERVIEW myPers/00_Datasets/Baseline


In [None]:
# Load the baseline CSV, skipping malformed rows (with a warning) instead of failing.
# `error_bad_lines` was deprecated in pandas 1.3 and removed in 2.0; `on_bad_lines="warn"`
# is the equivalent of `error_bad_lines=False` with the default `warn_bad_lines=True`.
# Older pandas rejects the new keyword with a TypeError, so fall back to the old one there.
try:
    dfPJ = pd.read_csv('myPers_OPN_Baseline.csv', sep=",", on_bad_lines="warn")
except TypeError:
    dfPJ = pd.read_csv('myPers_OPN_Baseline.csv', sep=",", error_bad_lines=False)
dfPJ

Unnamed: 0,text,label
0,likes the sound of thunder.,1
1,is so sleepy it's not even funny that's she ca...,1
2,is sore and wants the knot of muscles at the b...,1
3,likes how the day sounds in this new song.,1
4,is home. <3,1
...,...,...
9912,little things give you away.,1
9913,is wishing it was Saturday.,1
9914,is studying hard for the G.R.E.,1
9915,snipers get more head,1


In [None]:
# Keep only the two columns used for training and coerce them to plain Python
# types (str text, int label). Iterating the two columns directly yields the same
# records as `iterrows()` without constructing a Series object for every row.
df_clean = [
    {'text': str(text), 'label': int(label)}
    for text, label in zip(dfPJ['text'], dfPJ['label'])
]

# Rebuild the frame from the cleaned records (fresh 0..n-1 index, columns text/label).
dfPJ = pd.DataFrame(df_clean)
dfPJ

Unnamed: 0,text,label
0,likes the sound of thunder.,1
1,is so sleepy it's not even funny that's she ca...,1
2,is sore and wants the knot of muscles at the b...,1
3,likes how the day sounds in this new song.,1
4,is home. <3,1
...,...,...
9912,little things give you away.,1
9913,is wishing it was Saturday.,1
9914,is studying hard for the G.R.E.,1
9915,snipers get more head,1


# Model Training

In [None]:
# Checkpoint identifier shared by the tokenizer and the classification model loaded below.
modeltype = "princeton-nlp/sup-simcse-bert-base-uncased"

In [None]:
# Stratified 80/20 split with a fixed seed, so both parts keep the label ratio.
# NOTE(review): `test` is also the Trainer's eval set during the hyperparameter search,
# so the selected configuration is tuned on it - consider a separate validation split.
train, test = train_test_split(dfPJ, test_size=0.2, random_state=0, stratify=dfPJ.label)

# Drop the shuffled pandas index rather than carrying it into the Dataset as an
# `__index_level_0__` column, which the model cannot consume (the Trainer logs it as ignored).
train = Dataset.from_pandas(train, preserve_index=False)
test = Dataset.from_pandas(test, preserve_index=False)

# Tokenizer belonging to the checkpoint named by `modeltype`.
tokenizer = AutoTokenizer.from_pretrained(modeltype)


def tokenize_function(examples):
    """Tokenize the "text" field of a batch of examples.

    Sequences are truncated and padded with ``padding="max_length"``, so every
    encoded row in the batch has the same length.

    Args:
        examples: batch handed over by ``Dataset.map(..., batched=True)``;
            must provide a "text" entry.

    Returns:
        The tokenizer's output for the batch of texts.
    """
    texts = examples["text"]
    encoded = tokenizer(texts, padding="max_length", truncation=True)
    return encoded


# Encode both splits batch-wise (train first, then test).
tokenized_train, tokenized_test = (
    split.map(tokenize_function, batched=True) for split in (train, test)
)

# Names under which the Trainer cell picks the encoded splits up.
full_train_dataset, full_eval_dataset = tokenized_train, tokenized_test

# Load the checkpoint as a 2-label sequence classifier (the classification head is newly
# initialised, as the load message below reports).
# NOTE(review): the Trainer further down is built with `model_init`, so this instance looks
# unused in the visible cells - confirm before removing it.
model = AutoModelForSequenceClassification.from_pretrained(modeltype, num_labels=2)

# Base Trainer configuration; the hyperparameter search overrides the sampled fields per trial.
training_args = TrainingArguments(
    output_dir="SIMCSE_BERT_OPN",
    # Evaluation: run once per epoch; "eval_f1" is the metric named for model selection.
    evaluation_strategy="epoch",
    metric_for_best_model="eval_f1",
    # Checkpointing: disabled via save_strategy; the step/limit values are kept as given.
    save_strategy="no",
    save_steps=100000,
    save_total_limit=1,
)

def compute_metrics(pred):
    """Compute macro-averaged classification metrics for one evaluation pass.

    As a side effect, prints the per-class classification report and the
    confusion matrix for labels 0 and 1.

    Args:
        pred: evaluation output exposing ``label_ids`` (true labels) and
            ``predictions`` (per-class scores; the argmax over the last axis
            is taken as the predicted class).

    Returns:
        dict with the keys 'accuracy', 'f1', 'precision' and 'recall'
        (precision/recall/f1 are macro averages).
    """
    labels = pred.label_ids
    preds = pred.predictions.argmax(-1)
    # zero_division=0 keeps the value sklearn already falls back to (0.0) when a class is
    # never predicted, but stops it from emitting a warning on every evaluation.
    precision, recall, f1, _ = precision_recall_fscore_support(
        labels, preds, average='macro', zero_division=0
    )
    acc = accuracy_score(labels, preds)
    print(classification_report(labels, preds, labels=[0, 1], zero_division=0))
    # Fixed label order keeps the matrix 2x2 and aligned with the report above.
    print(confusion_matrix(labels, preds, labels=[0, 1]))
    return {
        'accuracy': acc,
        'f1': f1,
        'precision': precision,
        'recall': recall
    }

Downloading:   0%|          | 0.00/252 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/689 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/226k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/112 [00:00<?, ?B/s]

  0%|          | 0/8 [00:00<?, ?ba/s]

  0%|          | 0/2 [00:00<?, ?ba/s]

Downloading:   0%|          | 0.00/418M [00:00<?, ?B/s]

Some weights of BertForSequenceClassification were not initialized from the model checkpoint at princeton-nlp/sup-simcse-bert-base-uncased and are newly initialized: ['classifier.weight', 'classifier.bias']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


# Hyperparameter Optimization

In [None]:
! pip install optuna --quiet

[K     |████████████████████████████████| 308 kB 13.3 MB/s 
[K     |████████████████████████████████| 80 kB 8.1 MB/s 
[K     |████████████████████████████████| 209 kB 54.8 MB/s 
[K     |████████████████████████████████| 75 kB 4.4 MB/s 
[K     |████████████████████████████████| 49 kB 6.0 MB/s 
[K     |████████████████████████████████| 112 kB 50.9 MB/s 
[K     |████████████████████████████████| 149 kB 51.0 MB/s 
[?25h  Building wheel for pyperclip (setup.py) ... [?25l[?25hdone


In [None]:
def model_init():
    """Build a new 2-label sequence classifier from the ``modeltype`` checkpoint.

    Handed to the Trainer as ``model_init`` so that a model can be created on
    demand instead of reusing one fixed instance.

    Returns:
        The model returned by ``AutoModelForSequenceClassification.from_pretrained``.
    """
    fresh_model = AutoModelForSequenceClassification.from_pretrained(
        modeltype,
        num_labels=2,
    )
    return fresh_model

In [None]:
# Trainer wired with the model factory (rather than a fixed model), the encoded
# train/eval splits and the metric callback defined above.
trainer = Trainer(
    model_init=model_init,
    args=training_args,
    train_dataset=full_train_dataset,
    eval_dataset=full_eval_dataset,
    compute_metrics=compute_metrics,
)

loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file

In [None]:
import sklearn.metrics as metrics
import optuna
import sys
import logging

def objective(metrics):
    """Pick the value the hyperparameter search optimises.

    Args:
        metrics: mapping of evaluation metrics; must contain the key 'eval_f1'.

    Returns:
        The value stored under 'eval_f1'.
    """
    eval_f1 = metrics['eval_f1']
    return eval_f1

def hyperparameter_space(trial):
    """Sample one hyperparameter configuration from the search space.

    Args:
        trial: object exposing ``suggest_float(name, low, high, log=...)`` and
            ``suggest_categorical(name, choices)``.

    Returns:
        dict with the sampled 'learning_rate', 'per_device_train_batch_size',
        'weight_decay' and 'num_train_epochs'.
    """
    # NOTE(review): the range reaches up to 5e-1; the logged trial with
    # learning_rate ~0.25 shows training losses in the tens - consider narrowing.
    learning_rate = trial.suggest_float("learning_rate", 5e-8, 5e-1, log=True)
    batch_size = trial.suggest_categorical("per_device_train_batch_size", [2, 4, 8, 16])
    weight_decay = trial.suggest_float("weight_decay", 5e-12, 5e-1, log=True)
    # Sampled as a float, so a trial may be asked to run a fractional number of epochs.
    num_train_epochs = trial.suggest_float("num_train_epochs", 1, 8, log=True)

    # Currently not searched: "adam_epsilon" (1e-10 .. 1e-6, log) and "seed" (10 .. 60, log).
    return {
        "learning_rate": learning_rate,
        "per_device_train_batch_size": batch_size,
        "weight_decay": weight_decay,
        "num_train_epochs": num_train_epochs,
    }

# Send Optuna's log messages to stdout as well, so trial results show up in the cell output.
optuna.logging.get_logger("optuna").addHandler(logging.StreamHandler(sys.stdout))
study_name = "SIMCSE_BERT_myPers_OPN"  # Unique identifier of the study.
# Trials are persisted in a SQLite file named after the study, in the working directory.
storage_name = "sqlite:///{}.db".format(study_name)

# Keyword arguments the Trainer does not consume itself are passed on to
# `optuna.create_study`. `load_if_exists=True` makes a re-run of this cell continue the
# stored study instead of failing because a study with this name already exists.
best_run = trainer.hyperparameter_search(
    hp_space=hyperparameter_space,
    compute_objective=objective,
    n_trials=50,
    direction="maximize",
    study_name=study_name,
    storage=storage_name,
    load_if_exists=True,
)

# Re-open the persisted study so `study` holds the trials that were just run
# (a bare `optuna.create_study()` would create a new, empty, unrelated study).
study = optuna.load_study(study_name=study_name, storage=storage_name)

[32m[I 2021-12-26 08:08:26,767][0m A new study created in RDB with name: SIMCSE_BERT_myPers_OPN[0m


A new study created in RDB with name: SIMCSE_BERT_myPers_OPN


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.562775,0.747984,0.453841,0.762744,0.512369
2,0.567700,0.550678,0.765121,0.580592,0.707627,0.579684
3,0.452400,0.7335,0.741935,0.641533,0.652987,0.63461
4,0.231800,1.291667,0.746472,0.623134,0.652731,0.613298
4,0.095900,1.35028,0.748992,0.629726,0.657765,0.619483


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.78      0.03      0.05       510
           1       0.75      1.00      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.76      0.51      0.45      1984
weighted avg       0.76      0.75      0.65      1984

[[  14  496]
 [   4 1470]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.20      0.30       510
           1       0.78      0.96      0.86      1474

    accuracy                           0.77      1984
   macro avg       0.71      0.58      0.58      1984
weighted avg       0.74      0.77      0.72      1984

[[ 101  409]
 [  57 1417]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.41      0.45       510
           1       0.81      0.86      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.63      0.64      1984
weighted avg       0.73      0.74      0.73      1984

[[ 211  299]
 [ 213 1261]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.34      0.41       510
           1       0.80      0.89      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.65      0.61      0.62      1984
weighted avg       0.72      0.75      0.73      1984

[[ 173  337]
 [ 166 1308]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.35      0.42       510
           1       0.80      0.89      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.62      0.63      1984
weighted avg       0.73      0.75      0.73      1984

[[ 180  330]
 [ 168 1306]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 08:44:29,532][0m Trial 0 finished with value: 0.6297259011085378 and parameters: {'learning_rate': 7.938170684431916e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.0117798083724145e-07, 'num_train_epochs': 4.417547496496372}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 0 finished with value: 0.6297259011085378 and parameters: {'learning_rate': 7.938170684431916e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.0117798083724145e-07, 'num_train_epochs': 4.417547496496372}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5865,0.576237,0.742944,0.426258,0.371472,0.5
2,0.5781,0.579458,0.742944,0.426258,0.371472,0.5
3,0.5684,0.577111,0.742944,0.426258,0.371472,0.5
4,0.5745,0.57156,0.742944,0.426258,0.371472,0.5
4,0.5691,0.570479,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 09:27:02,922][0m Trial 1 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 9.105112779088691e-05, 'per_device_train_batch_size': 8, 'weight_decay': 1.3970955434012717e-05, 'num_train_epochs': 4.940370160622992}. Best is trial 0 with value: 0.62972590110

Trial 1 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 9.105112779088691e-05, 'per_device_train_batch_size': 8, 'weight_decay': 1.3970955434012717e-05, 'num_train_epochs': 4.940370160622992}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,36.1526,20.516682,0.742944,0.426258,0.371472,0.5
2,29.0905,11.98659,0.257056,0.204491,0.128528,0.5
3,15.3398,7.377221,0.742944,0.426258,0.371472,0.5
4,6.6198,15.602224,0.257056,0.204491,0.128528,0.5
4,2.0972,1.656899,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.26      1.00      0.41       510
           1       0.00      0.00      0.00      1474

    accuracy                           0.26      1984
   macro avg       0.13      0.50      0.20      1984
weighted avg       0.07      0.26      0.11      1984

[[ 510    0]
 [1474    0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.26      1.00      0.41       510
           1       0.00      0.00      0.00      1474

    accuracy                           0.26      1984
   macro avg       0.13      0.50      0.20      1984
weighted avg       0.07      0.26      0.11      1984

[[ 510    0]
 [1474    0]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 10:20:00,862][0m Trial 2 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.24924007379730578, 'per_device_train_batch_size': 2, 'weight_decay': 0.0351322444546423, 'num_train_epochs': 4.589275599301454}. Best is trial 0 with value: 0.6297259011085378.

Trial 2 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.24924007379730578, 'per_device_train_batch_size': 2, 'weight_decay': 0.0351322444546423, 'num_train_epochs': 4.589275599301454}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6767,0.585306,0.742944,0.426258,0.371472,0.5
1,0.6076,0.569956,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 10:30:13,655][0m Trial 3 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.002094823940009471, 'per_device_train_batch_size': 8, 'weight_decay': 0.020959699276371143, 'num_train_epochs': 1.1104293395030982}. Best is trial 0 with value: 0.6297259011085

Trial 3 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.002094823940009471, 'per_device_train_batch_size': 8, 'weight_decay': 0.020959699276371143, 'num_train_epochs': 1.1104293395030982}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.8441,0.842264,0.742944,0.426258,0.371472,0.5
1,0.8115,0.828826,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 10:43:28,928][0m Trial 4 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.00014748982542257642, 'per_device_train_batch_size': 2, 'weight_decay': 5.701091959227532e-09, 'num_train_epochs': 1.0969618372918108}. Best is trial 0 with value: 0.6297259011

Trial 4 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.00014748982542257642, 'per_device_train_batch_size': 2, 'weight_decay': 5.701091959227532e-09, 'num_train_epochs': 1.0969618372918108}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.9056,0.798579,0.742944,0.426258,0.371472,0.5
2,0.7303,0.651146,0.742944,0.426258,0.371472,0.5
2,0.6286,0.574372,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 11:06:36,831][0m Trial 5 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.005193582221375533, 'per_device_train_batch_size': 8, 'weight_decay': 0.1268058158816691, 'num_train_epochs': 2.657386756262832}. Best is trial 0 with value: 0.6297259011085378

Trial 5 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.005193582221375533, 'per_device_train_batch_size': 8, 'weight_decay': 0.1268058158816691, 'num_train_epochs': 2.657386756262832}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6277,0.57671,0.742944,0.426258,0.371472,0.5
2,0.5704,0.573997,0.742944,0.426258,0.371472,0.5
2,0.5731,0.573965,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 11:26:18,110][0m Trial 6 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 2.5712238591451276e-07, 'per_device_train_batch_size': 8, 'weight_decay': 7.451598279845769e-08, 'num_train_epochs': 2.224512441335921}. Best is trial 0 with value: 0.62972590110

Trial 6 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 2.5712238591451276e-07, 'per_device_train_batch_size': 8, 'weight_decay': 7.451598279845769e-08, 'num_train_epochs': 2.224512441335921}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,10.3468,7.369725,0.742944,0.426258,0.371472,0.5
1,9.1423,2.907565,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 11:38:19,817][0m Trial 7 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.1406138008482885, 'per_device_train_batch_size': 4, 'weight_decay': 3.498291856029254e-06, 'num_train_epochs': 1.2107526090854794}. Best is trial 0 with value: 0.62972590110853

Trial 7 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.1406138008482885, 'per_device_train_batch_size': 4, 'weight_decay': 3.498291856029254e-06, 'num_train_epochs': 1.2107526090854794}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.677177,0.742944,0.426258,0.371472,0.5
2,1.304600,1.544762,0.742944,0.426258,0.371472,0.5
3,1.047400,0.572451,0.742944,0.426258,0.371472,0.5
3,0.951200,0.574366,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 12:07:15,457][0m Trial 8 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.01705713334505547, 'per_device_train_batch_size': 16, 'weight_decay': 3.848107718466195e-06, 'num_train_epochs': 3.567578309314404}. Best is trial 0 with value: 0.6297259011085

Trial 8 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.01705713334505547, 'per_device_train_batch_size': 16, 'weight_decay': 3.848107718466195e-06, 'num_train_epochs': 3.567578309314404}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.9715,1.227961,0.742944,0.426258,0.371472,0.5
1,0.9894,0.991875,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.



Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 12:24:50,912][0m Trial 9 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.001774046256208598, 'per_device_train_batch_size': 2, 'weight_decay': 8.088637700418087e-10, 'num_train_epochs': 1.5290486026803884}. Best is trial 0 with value: 0.629725901108

Trial 9 finished with value: 0.42625795257374205 and parameters: {'learning_rate': 0.001774046256208598, 'per_device_train_batch_size': 2, 'weight_decay': 8.088637700418087e-10, 'num_train_epochs': 1.5290486026803884}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.56115,0.742944,0.426258,0.371472,0.5
2,0.571200,0.551184,0.743952,0.430411,0.871847,0.501961
3,0.548200,0.546043,0.753024,0.478079,0.773213,0.524096
4,0.522600,0.543137,0.754032,0.523494,0.688934,0.544651
5,0.496800,0.544246,0.752016,0.545143,0.665935,0.555477
6,0.471500,0.544988,0.744456,0.568468,0.639667,0.568341
7,0.453500,0.549531,0.74748,0.560034,0.647334,0.563324
7,0.436400,0.549327,0.744456,0.563706,0.63909,0.565136


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.00      0.01       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.87      0.50      0.43      1984
weighted avg       0.81      0.74      0.64      1984

[[   2  508]
 [   0 1474]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.79      0.05      0.10       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.77      0.52      0.48      1984
weighted avg       0.76      0.75      0.66      1984

[[  27  483]
 [   7 1467]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.62      0.11      0.19       510
           1       0.76      0.98      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.69      0.54      0.52      1984
weighted avg       0.72      0.75      0.68      1984

[[  58  452]
 [  36 1438]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.57      0.15      0.24       510
           1       0.77      0.96      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.67      0.56      0.55      1984
weighted avg       0.71      0.75      0.69      1984

[[  77  433]
 [  59 1415]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.21      0.29       510
           1       0.77      0.93      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.57      0.57      1984
weighted avg       0.70      0.74      0.70      1984

[[ 105  405]
 [ 102 1372]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.53      0.18      0.27       510
           1       0.77      0.94      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.65      0.56      0.56      1984
weighted avg       0.71      0.75      0.70      1984

[[  94  416]
 [  85 1389]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.20      0.28       510
           1       0.77      0.93      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.57      0.56      1984
weighted avg       0.70      0.74      0.70      1984

[[ 100  410]
 [  97 1377]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 13:28:18,725][0m Trial 10 finished with value: 0.5637058251757624 and parameters: {'learning_rate': 2.8764583368954434e-06, 'per_device_train_batch_size': 16, 'weight_decay': 5.686880929802635e-11, 'num_train_epochs': 7.913531923612611}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 10 finished with value: 0.5637058251757624 and parameters: {'learning_rate': 2.8764583368954434e-06, 'per_device_train_batch_size': 16, 'weight_decay': 5.686880929802635e-11, 'num_train_epochs': 7.913531923612611}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.562082,0.742944,0.426258,0.371472,0.5
2,0.572000,0.552733,0.743448,0.428338,0.871659,0.50098
3,0.550300,0.547644,0.74748,0.451869,0.756018,0.511388
4,0.527800,0.543974,0.753024,0.506681,0.698106,0.536279
5,0.505800,0.543147,0.755544,0.538258,0.687458,0.552722
6,0.483800,0.543103,0.746976,0.552453,0.645712,0.558496


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.87      0.50      0.43      1984
weighted avg       0.81      0.74      0.63      1984

[[   1  509]
 [   0 1474]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.76      0.03      0.05       510
           1       0.75      1.00      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.76      0.51      0.45      1984
weighted avg       0.75      0.75      0.65      1984

[[  13  497]
 [   4 1470]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.64      0.09      0.16       510
           1       0.76      0.98      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.70      0.54      0.51      1984
weighted avg       0.73      0.75      0.68      1984

[[  46  464]
 [  26 1448]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.14      0.22       510
           1       0.76      0.97      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.69      0.55      0.54      1984
weighted avg       0.72      0.76      0.69      1984

[[  69  441]
 [  44 1430]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.17      0.26       510
           1       0.77      0.95      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.65      0.56      0.55      1984
weighted avg       0.70      0.75      0.70      1984

[[  87  423]
 [  79 1395]]


[32m[I 2021-12-26 14:16:22,905][0m Trial 11 pruned. [0m


Trial 11 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.555768,0.743448,0.428338,0.871659,0.50098
2,0.566600,0.541704,0.756552,0.508824,0.73295,0.538653
3,0.529800,0.543498,0.754032,0.548841,0.673829,0.558116
4,0.480300,0.55642,0.743952,0.581546,0.640417,0.57762
5,0.429500,0.57951,0.74496,0.583193,0.642804,0.57894
6,0.384000,0.587422,0.735383,0.602541,0.631713,0.594936
7,0.350700,0.600663,0.738911,0.598969,0.63547,0.59154
7,0.326900,0.599579,0.738911,0.601152,0.636108,0.593463


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.87      0.50      0.43      1984
weighted avg       0.81      0.74      0.63      1984

[[   1  509]
 [   0 1474]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.71      0.09      0.16       510
           1       0.76      0.99      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.73      0.54      0.51      1984
weighted avg       0.75      0.76      0.68      1984

[[  46  464]
 [  19 1455]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.58      0.15      0.24       510
           1       0.77      0.96      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.67      0.56      0.55      1984
weighted avg       0.72      0.75      0.70      1984

[[  79  431]
 [  57 1417]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.24      0.32       510
           1       0.78      0.92      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.58      0.58      1984
weighted avg       0.71      0.74      0.71      1984

[[ 120  390]
 [ 118 1356]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.24      0.32       510
           1       0.78      0.92      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.58      0.58      1984
weighted avg       0.71      0.74      0.71      1984

[[ 121  389]
 [ 117 1357]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.48      0.31      0.37       510
           1       0.79      0.88      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.63      0.59      0.60      1984
weighted avg       0.71      0.74      0.71      1984

[[ 156  354]
 [ 171 1303]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.29      0.36       510
           1       0.78      0.89      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.59      0.60      1984
weighted avg       0.71      0.74      0.71      1984

[[ 147  363]
 [ 155 1319]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.29      0.37       510
           1       0.79      0.89      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.59      0.60      1984
weighted avg       0.71      0.74      0.72      1984

[[ 150  360]
 [ 158 1316]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 15:14:49,754][0m Trial 12 finished with value: 0.6011518609073622 and parameters: {'learning_rate': 4.775435462681336e-06, 'per_device_train_batch_size': 16, 'weight_decay': 8.95677938171612e-12, 'num_train_epochs': 7.2279998930948866}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 12 finished with value: 0.6011518609073622 and parameters: {'learning_rate': 4.775435462681336e-06, 'per_device_train_batch_size': 16, 'weight_decay': 8.95677938171612e-12, 'num_train_epochs': 7.2279998930948866}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.542651,0.75252,0.476203,0.7699,0.523116
2,0.557100,0.558552,0.756552,0.578732,0.674202,0.577124
3,0.465500,0.612455,0.726815,0.618257,0.629366,0.612252
4,0.330100,0.772239,0.730847,0.608854,0.628848,0.601501
5,0.205400,0.936336,0.729839,0.620192,0.632863,0.613646
5,0.129500,0.982301,0.733367,0.612199,0.63291,0.604479


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.79      0.05      0.10       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.77      0.52      0.48      1984
weighted avg       0.76      0.75      0.66      1984

[[  26  484]
 [   7 1467]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.57      0.21      0.31       510
           1       0.78      0.95      0.85      1474

    accuracy                           0.76      1984
   macro avg       0.67      0.58      0.58      1984
weighted avg       0.72      0.76      0.71      1984

[[ 106  404]
 [  79 1395]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.46      0.38      0.41       510
           1       0.80      0.85      0.82      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.61      0.62      1984
weighted avg       0.71      0.73      0.72      1984

[[ 192  318]
 [ 224 1250]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.34      0.39       510
           1       0.79      0.87      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.60      0.61      1984
weighted avg       0.71      0.73      0.71      1984

[[ 171  339]
 [ 195 1279]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.37      0.42       510
           1       0.80      0.85      0.82      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.61      0.62      1984
weighted avg       0.71      0.73      0.72      1984

[[ 191  319]
 [ 217 1257]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.34      0.40       510
           1       0.79      0.87      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.60      0.61      1984
weighted avg       0.71      0.73      0.72      1984

[[ 173  337]
 [ 192 1282]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 16:00:17,925][0m Trial 13 finished with value: 0.6121986051452588 and parameters: {'learning_rate': 1.2218645158411856e-05, 'per_device_train_batch_size': 16, 'weight_decay': 5.8152450109840236e-08, 'num_train_epochs': 5.645854909698767}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 13 finished with value: 0.6121986051452588 and parameters: {'learning_rate': 1.2218645158411856e-05, 'per_device_train_batch_size': 16, 'weight_decay': 5.8152450109840236e-08, 'num_train_epochs': 5.645854909698767}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.545129,0.753024,0.484438,0.745721,0.526661
2,0.553200,0.579504,0.74496,0.606818,0.646891,0.598175
3,0.407800,0.829453,0.71623,0.625877,0.626814,0.625005
4,0.189300,1.360759,0.746976,0.60702,0.650344,0.598249
5,0.074700,1.55321,0.738911,0.622422,0.642887,0.613981
5,0.027600,1.557255,0.737903,0.622185,0.641672,0.613944


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.74      0.06      0.11       510
           1       0.75      0.99      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.75      0.53      0.48      1984
weighted avg       0.75      0.75      0.67      1984

[[  31  479]
 [  11 1463]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.30      0.37       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.60      0.61      1984
weighted avg       0.72      0.74      0.72      1984

[[ 151  359]
 [ 147 1327]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.45      0.44      0.44       510
           1       0.81      0.81      0.81      1474

    accuracy                           0.72      1984
   macro avg       0.63      0.63      0.63      1984
weighted avg       0.71      0.72      0.72      1984

[[ 223  287]
 [ 276 1198]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.29      0.37       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.65      0.60      0.61      1984
weighted avg       0.72      0.75      0.72      1984

[[ 149  361]
 [ 141 1333]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.36      0.41       510
           1       0.80      0.87      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.61      0.62      1984
weighted avg       0.72      0.74      0.72      1984

[[ 182  328]
 [ 190 1284]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.36      0.41       510
           1       0.80      0.87      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.61      0.62      1984
weighted avg       0.72      0.74      0.72      1984

[[ 183  327]
 [ 193 1281]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 16:41:57,550][0m Trial 14 finished with value: 0.6221854707227432 and parameters: {'learning_rate': 2.4872860441210207e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.000225088124687041, 'num_train_epochs': 5.127132643894254}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 14 finished with value: 0.6221854707227432 and parameters: {'learning_rate': 2.4872860441210207e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.000225088124687041, 'num_train_epochs': 5.127132643894254}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.593,0.570541,0.745464,0.438438,0.801106,0.505543
2,0.5436,0.741521,0.759073,0.507486,0.772007,0.539067
3,0.418,1.059431,0.754536,0.626035,0.665978,0.614879
3,0.1937,1.454044,0.731351,0.618519,0.633492,0.611457


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.86      0.01      0.02       510
           1       0.75      1.00      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.80      0.51      0.44      1984
weighted avg       0.77      0.75      0.64      1984

[[   6  504]
 [   1 1473]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.79      0.09      0.16       510
           1       0.76      0.99      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.77      0.54      0.51      1984
weighted avg       0.77      0.76      0.68      1984

[[  44  466]
 [  12 1462]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.54      0.33      0.41       510
           1       0.79      0.90      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.67      0.61      0.63      1984
weighted avg       0.73      0.75      0.73      1984

[[ 167  343]
 [ 144 1330]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.36      0.41       510
           1       0.80      0.86      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.61      0.62      1984
weighted avg       0.71      0.73      0.72      1984

[[ 186  324]
 [ 209 1265]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 17:18:32,667][0m Trial 15 finished with value: 0.6185186588095664 and parameters: {'learning_rate': 4.03990606088607e-05, 'per_device_train_batch_size': 4, 'weight_decay': 0.00052164210061194, 'num_train_epochs': 3.874751284872604}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 15 finished with value: 0.6185186588095664 and parameters: {'learning_rate': 4.03990606088607e-05, 'per_device_train_batch_size': 4, 'weight_decay': 0.00052164210061194, 'num_train_epochs': 3.874751284872604}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.619343,0.740423,0.425427,0.371147,0.498304


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   5 1469]]


[32m[I 2021-12-26 17:26:35,661][0m Trial 16 pruned. [0m


Trial 16 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.570856,0.742944,0.426258,0.371472,0.5
2,0.603500,0.573652,0.742944,0.426258,0.371472,0.5
3,0.584500,0.573652,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 17:50:38,665][0m Trial 17 pruned. [0m


Trial 17 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.571272,0.742944,0.426258,0.371472,0.5
2,0.583800,0.568999,0.742944,0.426258,0.371472,0.5
2,0.566700,0.568952,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 18:09:16,456][0m Trial 18 pruned. [0m


Trial 18 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5742,0.570075,0.751008,0.465525,0.791667,0.518251
2,0.497,0.862075,0.762097,0.550047,0.718636,0.560979
3,0.3083,1.280751,0.748488,0.61682,0.654539,0.606961
4,0.1093,1.749733,0.74244,0.609708,0.643632,0.600967
4,0.1018,1.806562,0.736895,0.613832,0.637538,0.605571


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.83      0.04      0.07       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.79      0.52      0.47      1984
weighted avg       0.77      0.75      0.66      1984

[[  20  490]
 [   4 1470]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.67      0.15      0.24       510
           1       0.77      0.97      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.72      0.56      0.55      1984
weighted avg       0.74      0.76      0.70      1984

[[  75  435]
 [  37 1437]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.32      0.39       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.65      0.61      0.62      1984
weighted avg       0.72      0.75      0.73      1984

[[ 161  349]
 [ 150 1324]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.31      0.38       510
           1       0.79      0.89      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.60      0.61      1984
weighted avg       0.71      0.74      0.72      1984

[[ 158  352]
 [ 159 1315]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.48      0.34      0.40       510
           1       0.79      0.88      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.61      0.61      1984
weighted avg       0.71      0.74      0.72      1984

[[ 171  339]
 [ 183 1291]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 18:49:56,966][0m Trial 19 finished with value: 0.613831615120275 and parameters: {'learning_rate': 2.3701452712891675e-05, 'per_device_train_batch_size': 4, 'weight_decay': 0.004418539989332095, 'num_train_epochs': 4.269238799024415}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 19 finished with value: 0.613831615120275 and parameters: {'learning_rate': 2.3701452712891675e-05, 'per_device_train_batch_size': 4, 'weight_decay': 0.004418539989332095, 'num_train_epochs': 4.269238799024415}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.575126,0.742944,0.426258,0.371472,0.5
2,0.584400,0.577541,0.742944,0.426258,0.371472,0.5
3,0.575400,0.574776,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 19:14:03,034][0m Trial 20 pruned. [0m


Trial 20 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5925,0.573209,0.742944,0.426258,0.371472,0.5
2,0.5617,0.575909,0.748992,0.531372,0.655632,0.54703
3,0.5557,0.71845,0.756552,0.580631,0.673737,0.578406
3,0.365,1.116308,0.75252,0.624314,0.662323,0.613522


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.55      0.13      0.21       510
           1       0.76      0.96      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.55      0.53      1984
weighted avg       0.71      0.75      0.69      1984

[[  67  443]
 [  55 1419]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.57      0.21      0.31       510
           1       0.78      0.95      0.85      1474

    accuracy                           0.76      1984
   macro avg       0.67      0.58      0.58      1984
weighted avg       0.72      0.76      0.71      1984

[[ 108  402]
 [  81 1393]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.53      0.33      0.40       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.61      0.62      1984
weighted avg       0.73      0.75      0.73      1984

[[ 167  343]
 [ 148 1326]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 19:51:11,467][0m Trial 21 finished with value: 0.6243141565190563 and parameters: {'learning_rate': 4.191884223796244e-05, 'per_device_train_batch_size': 4, 'weight_decay': 0.0004720500586884353, 'num_train_epochs': 3.8950982499459768}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 21 finished with value: 0.6243141565190563 and parameters: {'learning_rate': 4.191884223796244e-05, 'per_device_train_batch_size': 4, 'weight_decay': 0.0004720500586884353, 'num_train_epochs': 3.8950982499459768}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5688,0.578653,0.751008,0.468881,0.768113,0.519533
2,0.4764,0.849019,0.761593,0.585573,0.689901,0.582439
3,0.3395,1.266789,0.753024,0.622026,0.662943,0.611296
3,0.1725,1.395384,0.744456,0.622716,0.64984,0.613224


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.79      0.04      0.08       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.77      0.52      0.47      1984
weighted avg       0.76      0.75      0.66      1984

[[  22  488]
 [   6 1468]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.60      0.21      0.32       510
           1       0.78      0.95      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.69      0.58      0.59      1984
weighted avg       0.73      0.76      0.72      1984

[[ 109  401]
 [  72 1402]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.53      0.32      0.40       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.61      0.62      1984
weighted avg       0.73      0.75      0.73      1984

[[ 163  347]
 [ 143 1331]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.34      0.41       510
           1       0.80      0.88      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.61      0.62      1984
weighted avg       0.72      0.74      0.73      1984

[[ 175  335]
 [ 172 1302]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 20:24:21,126][0m Trial 22 finished with value: 0.6227156470790776 and parameters: {'learning_rate': 1.6502386249986932e-05, 'per_device_train_batch_size': 4, 'weight_decay': 5.109043427278698e-07, 'num_train_epochs': 3.4418368177758083}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 22 finished with value: 0.6227156470790776 and parameters: {'learning_rate': 1.6502386249986932e-05, 'per_device_train_batch_size': 4, 'weight_decay': 5.109043427278698e-07, 'num_train_epochs': 3.4418368177758083}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5798,0.576984,0.742944,0.426258,0.371472,0.5
2,0.572,0.578908,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 20:43:26,641][0m Trial 23 pruned. [0m


Trial 23 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5873,0.573805,0.742944,0.426258,0.371472,0.5
2,0.5709,0.581278,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 21:02:30,704][0m Trial 24 pruned. [0m


Trial 24 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5662,0.576866,0.751008,0.468881,0.768113,0.519533
1,0.4698,0.604363,0.756048,0.555855,0.680139,0.562679


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.79      0.04      0.08       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.77      0.52      0.47      1984
weighted avg       0.76      0.75      0.66      1984

[[  22  488]
 [   6 1468]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.59      0.16      0.26       510
           1       0.77      0.96      0.85      1474

    accuracy                           0.76      1984
   macro avg       0.68      0.56      0.56      1984
weighted avg       0.72      0.76      0.70      1984

[[  84  426]
 [  58 1416]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 21:19:37,417][0m Trial 25 finished with value: 0.5558548624627202 and parameters: {'learning_rate': 8.795038060179635e-06, 'per_device_train_batch_size': 4, 'weight_decay': 5.284877813800335e-07, 'num_train_epochs': 1.7948792732489052}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 25 finished with value: 0.5558548624627202 and parameters: {'learning_rate': 8.795038060179635e-06, 'per_device_train_batch_size': 4, 'weight_decay': 5.284877813800335e-07, 'num_train_epochs': 1.7948792732489052}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5953,0.576066,0.742944,0.426258,0.371472,0.5
2,0.5752,0.685463,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 21:38:27,558][0m Trial 26 pruned. [0m


Trial 26 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.581,0.572359,0.742944,0.426258,0.371472,0.5
2,0.5659,0.571573,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 21:57:17,633][0m Trial 27 pruned. [0m


Trial 27 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5833,0.561853,0.74496,0.434534,0.872222,0.503922
2,0.5446,0.69321,0.755544,0.529612,0.694298,0.548233
3,0.4799,0.933802,0.75,0.599583,0.655223,0.591949
4,0.2496,1.305342,0.733871,0.611335,0.633128,0.603536
4,0.2351,1.385633,0.730847,0.613255,0.630719,0.605989


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.01      0.02       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.87      0.50      0.43      1984
weighted avg       0.81      0.74      0.64      1984

[[   4  506]
 [   0 1474]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.12      0.20       510
           1       0.76      0.97      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.69      0.55      0.53      1984
weighted avg       0.73      0.76      0.69      1984

[[  62  448]
 [  37 1437]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.53      0.27      0.35       510
           1       0.78      0.92      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.59      0.60      1984
weighted avg       0.72      0.75      0.72      1984

[[ 136  374]
 [ 122 1352]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.34      0.39       510
           1       0.79      0.87      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.60      0.61      1984
weighted avg       0.71      0.73      0.72      1984

[[ 171  339]
 [ 189 1285]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.35      0.40       510
           1       0.79      0.86      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.61      0.61      1984
weighted avg       0.71      0.73      0.72      1984

[[ 178  332]
 [ 202 1272]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 22:36:47,995][0m Trial 28 finished with value: 0.6132553606237816 and parameters: {'learning_rate': 4.46912604574302e-05, 'per_device_train_batch_size': 4, 'weight_decay': 2.4655165685811364e-07, 'num_train_epochs': 4.137939010652064}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 28 finished with value: 0.6132553606237816 and parameters: {'learning_rate': 4.46912604574302e-05, 'per_device_train_batch_size': 4, 'weight_decay': 2.4655165685811364e-07, 'num_train_epochs': 4.137939010652064}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5899,0.574594,0.742944,0.426258,0.371472,0.5
2,0.5739,0.661879,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-26 22:55:52,563][0m Trial 29 pruned. [0m


Trial 29 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.8457,0.84897,0.75252,0.471277,0.801501,0.521192
2,0.7491,0.9663,0.766633,0.595258,0.704546,0.589679
2,0.4859,1.089001,0.753528,0.610222,0.663126,0.600736


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.85      0.05      0.09       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.80      0.52      0.47      1984
weighted avg       0.78      0.75      0.66      1984

[[  23  487]
 [   4 1470]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.63      0.23      0.33       510
           1       0.78      0.95      0.86      1474

    accuracy                           0.77      1984
   macro avg       0.70      0.59      0.60      1984
weighted avg       0.74      0.77      0.72      1984

[[ 115  395]
 [  68 1406]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.54      0.29      0.37       510
           1       0.79      0.92      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.60      0.61      1984
weighted avg       0.72      0.75      0.73      1984

[[ 146  364]
 [ 125 1349]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-26 23:23:01,399][0m Trial 30 finished with value: 0.6102219042067105 and parameters: {'learning_rate': 1.0572138580141994e-05, 'per_device_train_batch_size': 2, 'weight_decay': 0.4874071227704652, 'num_train_epochs': 2.3395849854085395}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 30 finished with value: 0.6102219042067105 and parameters: {'learning_rate': 1.0572138580141994e-05, 'per_device_train_batch_size': 2, 'weight_decay': 0.4874071227704652, 'num_train_epochs': 2.3395849854085395}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.540002,0.754032,0.498658,0.722813,0.53311
2,0.556200,0.593291,0.75504,0.617395,0.666421,0.606883
3,0.385000,1.054122,0.723286,0.63277,0.634744,0.631036
4,0.153900,1.530938,0.733871,0.626995,0.639523,0.620206
4,0.048600,1.599905,0.740927,0.619113,0.644218,0.610208


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.69      0.08      0.14       510
           1       0.76      0.99      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.72      0.53      0.50      1984
weighted avg       0.74      0.75      0.67      1984

[[  40  470]
 [  18 1456]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.54      0.30      0.39       510
           1       0.79      0.91      0.85      1474

    accuracy                           0.76      1984
   macro avg       0.67      0.61      0.62      1984
weighted avg       0.73      0.76      0.73      1984

[[ 154  356]
 [ 130 1344]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.46      0.44      0.45       510
           1       0.81      0.82      0.82      1474

    accuracy                           0.72      1984
   macro avg       0.63      0.63      0.63      1984
weighted avg       0.72      0.72      0.72      1984

[[ 225  285]
 [ 264 1210]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.48      0.39      0.43       510
           1       0.80      0.85      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.64      0.62      0.63      1984
weighted avg       0.72      0.73      0.72      1984

[[ 197  313]
 [ 215 1259]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.34      0.40       510
           1       0.79      0.88      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.61      0.62      1984
weighted avg       0.72      0.74      0.72      1984

[[ 174  336]
 [ 178 1296]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-27 00:00:20,012][0m Trial 31 finished with value: 0.619113070578164 and parameters: {'learning_rate': 4.0307606308861596e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.00031391492520342217, 'num_train_epochs': 4.607449515519003}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 31 finished with value: 0.619113070578164 and parameters: {'learning_rate': 4.0307606308861596e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.00031391492520342217, 'num_train_epochs': 4.607449515519003}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5984,0.581039,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 00:09:00,211][0m Trial 32 pruned. [0m


Trial 32 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5937,0.57415,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 00:18:30,611][0m Trial 33 pruned. [0m


Trial 33 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6052,0.590978,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 00:29:47,020][0m Trial 34 pruned. [0m


Trial 34 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.540605,0.752016,0.482334,0.733559,0.525341
2,0.552600,0.576641,0.753528,0.604057,0.663012,0.595606
3,0.416300,0.700009,0.734375,0.630208,0.641377,0.623752
3,0.232700,0.732423,0.741431,0.615642,0.643836,0.6067


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.71      0.06      0.11       510
           1       0.75      0.99      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.73      0.53      0.48      1984
weighted avg       0.74      0.75      0.66      1984

[[  30  480]
 [  12 1462]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.54      0.27      0.36       510
           1       0.78      0.92      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.60      0.60      1984
weighted avg       0.72      0.75      0.72      1984

[[ 138  372]
 [ 117 1357]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.48      0.40      0.43       510
           1       0.80      0.85      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.64      0.62      0.63      1984
weighted avg       0.72      0.73      0.73      1984

[[ 202  308]
 [ 219 1255]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.33      0.40       510
           1       0.79      0.88      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.61      0.62      1984
weighted avg       0.72      0.74      0.72      1984

[[ 168  342]
 [ 171 1303]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-27 00:56:36,550][0m Trial 35 finished with value: 0.6156419618954613 and parameters: {'learning_rate': 2.258288638119073e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.0346546993574772e-06, 'num_train_epochs': 3.2704737613347286}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 35 finished with value: 0.6156419618954613 and parameters: {'learning_rate': 2.258288638119073e-05, 'per_device_train_batch_size': 16, 'weight_decay': 1.0346546993574772e-06, 'num_train_epochs': 3.2704737613347286}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.592,0.578938,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 01:05:16,691][0m Trial 36 pruned. [0m


Trial 36 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,1.1038,0.873736,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 01:14:50,434][0m Trial 37 pruned. [0m


Trial 37 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5665,0.553621,0.743448,0.428338,0.871659,0.50098
2,0.5239,0.542574,0.75504,0.5162,0.704727,0.541482
2,0.4725,0.544695,0.756552,0.544904,0.68877,0.556606


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.87      0.50      0.43      1984
weighted avg       0.81      0.74      0.63      1984

[[   1  509]
 [   0 1474]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.65      0.10      0.18       510
           1       0.76      0.98      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.70      0.54      0.52      1984
weighted avg       0.73      0.76      0.68      1984

[[  52  458]
 [  28 1446]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.61      0.15      0.23       510
           1       0.77      0.97      0.86      1474

    accuracy                           0.76      1984
   macro avg       0.69      0.56      0.54      1984
weighted avg       0.73      0.76      0.70      1984

[[  74  436]
 [  47 1427]]


[32m[I 2021-12-27 01:40:10,699][0m Trial 38 pruned. [0m


Trial 38 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.8251,0.862959,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 01:51:40,595][0m Trial 39 pruned. [0m


Trial 39 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,4.335145,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 01:59:45,913][0m Trial 40 pruned. [0m


Trial 40 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.541231,0.751512,0.478905,0.735067,0.52372
2,0.557200,0.58709,0.751008,0.618247,0.658991,0.608016
3,0.393800,0.995093,0.731855,0.637552,0.642826,0.633597
4,0.154700,1.493702,0.742944,0.616903,0.646238,0.607718
4,0.047300,1.551081,0.74244,0.622285,0.647086,0.613149


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.72      0.05      0.10       510
           1       0.75      0.99      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.74      0.52      0.48      1984
weighted avg       0.74      0.75      0.66      1984

[[  28  482]
 [  11 1463]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.53      0.31      0.39       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.61      0.62      1984
weighted avg       0.72      0.75      0.73      1984

[[ 160  350]
 [ 144 1330]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.48      0.43      0.45       510
           1       0.81      0.84      0.82      1474

    accuracy                           0.73      1984
   macro avg       0.64      0.63      0.64      1984
weighted avg       0.72      0.73      0.73      1984

[[ 220  290]
 [ 242 1232]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.33      0.40       510
           1       0.79      0.89      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.61      0.62      1984
weighted avg       0.72      0.74      0.72      1984

[[ 168  342]
 [ 168 1306]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.50      0.35      0.41       510
           1       0.80      0.88      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.61      0.62      1984
weighted avg       0.72      0.74      0.73      1984

[[ 177  333]
 [ 178 1296]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-27 02:35:51,016][0m Trial 41 finished with value: 0.622284606170795 and parameters: {'learning_rate': 4.302018644641139e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0004311021190148843, 'num_train_epochs': 4.43403753860061}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 41 finished with value: 0.622284606170795 and parameters: {'learning_rate': 4.302018644641139e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0004311021190148843, 'num_train_epochs': 4.43403753860061}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.540995,0.752016,0.485455,0.724503,0.526624
2,0.554600,0.566025,0.751008,0.585362,0.657071,0.581087
3,0.443900,0.648047,0.731855,0.622451,0.635693,0.615644
4,0.286700,0.804755,0.732863,0.61492,0.633468,0.607346
4,0.170200,0.809174,0.731351,0.611173,0.630348,0.603763


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.70      0.06      0.12       510
           1       0.75      0.99      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.72      0.53      0.49      1984
weighted avg       0.74      0.75      0.67      1984

[[  32  478]
 [  14 1460]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.54      0.23      0.32       510
           1       0.78      0.93      0.85      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.58      0.59      1984
weighted avg       0.72      0.75      0.71      1984

[[ 118  392]
 [ 102 1372]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.38      0.42       510
           1       0.80      0.85      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.64      0.62      0.62      1984
weighted avg       0.71      0.73      0.72      1984

[[ 192  318]
 [ 214 1260]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.35      0.40       510
           1       0.79      0.87      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.61      0.61      1984
weighted avg       0.71      0.73      0.72      1984

[[ 178  332]
 [ 198 1276]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.47      0.34      0.40       510
           1       0.79      0.87      0.83      1474

    accuracy                           0.73      1984
   macro avg       0.63      0.60      0.61      1984
weighted avg       0.71      0.73      0.72      1984

[[ 174  336]
 [ 197 1277]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-27 03:09:42,391][0m Trial 42 finished with value: 0.6111730676812102 and parameters: {'learning_rate': 1.613867923844534e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0021687913769903094, 'num_train_epochs': 4.134368821797008}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 42 finished with value: 0.6111730676812102 and parameters: {'learning_rate': 1.613867923844534e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.0021687913769903094, 'num_train_epochs': 4.134368821797008}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.559281,0.75,0.459941,0.799491,0.515649
2,0.563000,0.608835,0.748992,0.617244,0.655436,0.6073
3,0.392400,1.120633,0.712702,0.622943,0.623265,0.62263
4,0.155400,1.544318,0.736391,0.605434,0.634011,0.597538
4,0.052500,1.618315,0.737903,0.615311,0.639257,0.606891


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.85      0.03      0.06       510
           1       0.75      1.00      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.80      0.52      0.46      1984
weighted avg       0.77      0.75      0.65      1984

[[  17  493]
 [   3 1471]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.52      0.32      0.39       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.75      1984
   macro avg       0.66      0.61      0.62      1984
weighted avg       0.72      0.75      0.73      1984

[[ 161  349]
 [ 149 1325]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.44      0.44      0.44       510
           1       0.81      0.81      0.81      1474

    accuracy                           0.71      1984
   macro avg       0.62      0.62      0.62      1984
weighted avg       0.71      0.71      0.71      1984

[[ 223  287]
 [ 283 1191]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.48      0.31      0.38       510
           1       0.79      0.88      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.63      0.60      0.61      1984
weighted avg       0.71      0.74      0.72      1984

[[ 159  351]
 [ 172 1302]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.34      0.40       510
           1       0.79      0.88      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.64      0.61      0.62      1984
weighted avg       0.71      0.74      0.72      1984

[[ 172  338]
 [ 182 1292]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-27 03:45:23,702][0m Trial 43 finished with value: 0.6153111874761359 and parameters: {'learning_rate': 5.819447367275609e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.012787210805926066, 'num_train_epochs': 4.381077103246245}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 43 finished with value: 0.6153111874761359 and parameters: {'learning_rate': 5.819447367275609e-05, 'per_device_train_batch_size': 16, 'weight_decay': 0.012787210805926066, 'num_train_epochs': 4.381077103246245}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.555174,0.743448,0.428338,0.871659,0.50098


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       1.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.87      0.50      0.43      1984
weighted avg       0.81      0.74      0.63      1984

[[   1  509]
 [   0 1474]]


[32m[I 2021-12-27 03:53:27,016][0m Trial 44 pruned. [0m


Trial 44 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.568332,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 04:01:29,954][0m Trial 45 pruned. [0m


Trial 45 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.543721,0.751008,0.480229,0.721397,0.524022
2,0.552800,0.581962,0.74496,0.611795,0.647942,0.602663
3,0.400100,0.834718,0.722782,0.630872,0.633339,0.628773
3,0.180400,1.169417,0.739919,0.626887,0.645574,0.618506


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.69      0.06      0.11       510
           1       0.75      0.99      0.86      1474

    accuracy                           0.75      1984
   macro avg       0.72      0.52      0.48      1984
weighted avg       0.74      0.75      0.66      1984

[[  29  481]
 [  13 1461]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.51      0.31      0.38       510
           1       0.79      0.90      0.84      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.60      0.61      1984
weighted avg       0.72      0.74      0.72      1984

[[ 158  352]
 [ 154 1320]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.46      0.44      0.45       510
           1       0.81      0.82      0.82      1474

    accuracy                           0.72      1984
   macro avg       0.63      0.63      0.63      1984
weighted avg       0.72      0.72      0.72      1984

[[ 222  288]
 [ 262 1212]]


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.49      0.37      0.42       510
           1       0.80      0.87      0.83      1474

    accuracy                           0.74      1984
   macro avg       0.65      0.62      0.63      1984
weighted avg       0.72      0.74      0.73      1984

[[ 188  322]
 [ 194 1280]]




Training completed. Do not forget to share your model on huggingface.co/models =)


[32m[I 2021-12-27 04:32:45,752][0m Trial 46 finished with value: 0.6268871692898005 and parameters: {'learning_rate': 2.7946686647766176e-05, 'per_device_train_batch_size': 16, 'weight_decay': 9.526708810697573e-05, 'num_train_epochs': 3.890881441631214}. Best is trial 0 with value: 0.6297259011085378.[0m


Trial 46 finished with value: 0.6268871692898005 and parameters: {'learning_rate': 2.7946686647766176e-05, 'per_device_train_batch_size': 16, 'weight_decay': 9.526708810697573e-05, 'num_train_epochs': 3.890881441631214}. Best is trial 0 with value: 0.6297259011085378.


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.573331,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 04:40:48,437][0m Trial 47 pruned. [0m


Trial 47 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6975,0.569956,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 04:50:14,239][0m Trial 48 pruned. [0m


Trial 48 pruned. 


Trial:
loading configuration file https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/886dba277a27c6ab50ab3d0bfd8839d354cfeed717289623026415c62b687338.1b14bcddba43d86a607eedb4b638b87d30aa00c839358953dbd36f2cd3317c83
Model config BertConfig {
  "_name_or_path": "princeton-nlp/sup-simcse-bert-base-uncased",
  "architectures": [
    "BertModel"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.15.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weigh

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5706,0.559809,0.742944,0.426258,0.371472,0.5


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, __index_level_0__.
***** Running Evaluation *****
  Num examples = 1984
  Batch size = 8


              precision    recall  f1-score   support

           0       0.00      0.00      0.00       510
           1       0.74      1.00      0.85      1474

    accuracy                           0.74      1984
   macro avg       0.37      0.50      0.43      1984
weighted avg       0.55      0.74      0.63      1984

[[   0  510]
 [   0 1474]]



Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.


Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.

[32m[I 2021-12-27 04:58:49,731][0m Trial 49 pruned. [0m


Trial 49 pruned. 


[32m[I 2021-12-27 04:58:49,788][0m A new study created in memory with name: no-name-a0ce318f-fd0f-4bfa-acab-7495344456e6[0m


A new study created in memory with name: no-name-a0ce318f-fd0f-4bfa-acab-7495344456e6


In [None]:
# Inspect the storage URL that is passed to Optuna as `storage=` when the
# study is opened (a SQLite database URL, per the output of this cell).
storage_name

'sqlite:///SIMCSE_BERT_myPers_OPN.db'

In [None]:
# Inspect the name under which the Optuna study is registered in the storage.
study_name

'SIMCSE_BERT_myPers_OPN'

In [None]:
# Attach to the persisted Optuna study. Because load_if_exists=True, a study
# that already exists under this name in the storage is reused instead of
# raising a duplicate-study error.
study = optuna.create_study(
    study_name=study_name,
    storage=storage_name,
    load_if_exists=True,
    direction="maximize",
)

# One row per trial, restricted to the trial number, objective value,
# sampled hyperparameters (expanded into params_* columns) and trial state.
df = study.trials_dataframe(
    attrs=("number", "value", "params", "state"),
)

[32m[I 2021-12-27 04:58:49,903][0m Using an existing study with name 'SIMCSE_BERT_myPers_OPN' instead of creating a new one.[0m


Using an existing study with name 'SIMCSE_BERT_myPers_OPN' instead of creating a new one.


In [None]:
# Display the per-trial table (number, value, params_* columns, state).
# NOTE(review): the rendered table lists 10 trials, whereas the search log
# earlier in the notebook reports trials up to number 49 — confirm that this
# storage holds the study the hyperparameter search actually wrote to.
df

Unnamed: 0,number,value,params_learning_rate,params_num_train_epochs,params_per_device_train_batch_size,params_weight_decay,state
0,0,0.629726,7.938171e-05,4.417547,16,1.01178e-07,COMPLETE
1,1,0.426258,9.105113e-05,4.94037,8,1.397096e-05,COMPLETE
2,2,0.426258,0.2492401,4.589276,2,0.03513224,COMPLETE
3,3,0.426258,0.002094824,1.110429,8,0.0209597,COMPLETE
4,4,0.426258,0.0001474898,1.096962,2,5.701092e-09,COMPLETE
5,5,0.426258,0.005193582,2.657387,8,0.1268058,COMPLETE
6,6,0.426258,2.571224e-07,2.224512,8,7.451598e-08,COMPLETE
7,7,0.426258,0.1406138,1.210753,4,3.498292e-06,COMPLETE
8,8,0.426258,0.01705713,3.567578,16,3.848108e-06,COMPLETE
9,9,0.426258,0.001774046,1.529049,2,8.088638e-10,COMPLETE


In [None]:
# Plot the hyperparameter importances estimated from the study's trials.
fig = optuna.visualization.plot_param_importances(study)
fig.show()

In [None]:
# Show the best hyperparameter-search result: a BestRun carrying the run id,
# the objective value and the winning hyperparameters. `best_run` is assigned
# in an earlier cell (presumably by the Trainer hyperparameter search — verify).
best_run

BestRun(run_id='0', objective=0.6297259011085378, hyperparameters={'learning_rate': 7.938170684431916e-05, 'num_train_epochs': 4.417547496496372, 'per_device_train_batch_size': 16, 'weight_decay': 1.0117798083724145e-07})

In [None]:
# Plot the intermediate values reported by each trial of the study.
optuna.visualization.plot_intermediate_values(study)

In [None]:
# Parallel-coordinate view of the high-dimensional relationship between the
# sampled hyperparameters and the objective value.
optuna.visualization.plot_parallel_coordinate(study)

In [None]:
# Plot the optimization history (objective value of every trial in the study).
optuna.visualization.plot_optimization_history(study)

In [None]:
# Contour plots of the objective value over pairs of hyperparameters.
optuna.visualization.plot_contour(study)

In [None]:
# Slice plots: objective value against each hyperparameter individually.
optuna.visualization.plot_slice(study)

In [None]:
# Plot the empirical distribution function (EDF) of the study's objective values.
optuna.visualization.plot_edf(study)