In [None]:
import os 

In [None]:

# Install the third-party packages used below: transformers and datasets are
# imported directly, optuna is the backend passed to hyperparameter_search.
# NOTE(review): versions are not pinned - TODO pin them so reruns are reproducible.
!pip install -qq transformers
!pip install -qq optuna
!pip install -qq datasets

[K     |████████████████████████████████| 3.5 MB 13.5 MB/s 
[K     |████████████████████████████████| 596 kB 78.7 MB/s 
[K     |████████████████████████████████| 6.8 MB 89.6 MB/s 
[K     |████████████████████████████████| 895 kB 67.9 MB/s 
[K     |████████████████████████████████| 67 kB 5.3 MB/s 
[K     |████████████████████████████████| 308 kB 13.4 MB/s 
[K     |████████████████████████████████| 210 kB 82.7 MB/s 
[K     |████████████████████████████████| 80 kB 11.9 MB/s 
[K     |████████████████████████████████| 75 kB 5.7 MB/s 
[K     |████████████████████████████████| 49 kB 8.1 MB/s 
[K     |████████████████████████████████| 149 kB 85.4 MB/s 
[K     |████████████████████████████████| 113 kB 87.8 MB/s 
[?25h  Building wheel for pyperclip (setup.py) ... [?25l[?25hdone
[K     |████████████████████████████████| 311 kB 14.2 MB/s 
[K     |████████████████████████████████| 1.1 MB 77.4 MB/s 
[K     |████████████████████████████████| 133 kB 92.9 MB/s 
[K     |██████████████

In [None]:
import transformers
import datasets
from transformers import AutoTokenizer,AutoModelForQuestionAnswering, AutoModelForSequenceClassification,AdamW, get_linear_schedule_with_warmup,Trainer, TrainingArguments
from transformers import DataCollator, DataCollatorForLanguageModeling,default_data_collator
from transformers.file_utils import is_tf_available, is_torch_available, is_torch_tpu_available
import torch
import numpy as np
import pandas as pd
import seaborn as sns
from pylab import rcParams
import matplotlib.pyplot as plt
from matplotlib import rc
from sklearn.model_selection import train_test_split
from sklearn.metrics import confusion_matrix, classification_report
from collections import defaultdict
import random
from textwrap import wrap
from datetime import datetime
from datasets import load_from_disk
from datasets import load_dataset
from datasets import Dataset
from sklearn.metrics import accuracy_score,classification_report, confusion_matrix
from sklearn.metrics import precision_recall_fscore_support
from torch import nn

In [None]:
# Checkpoint to fine-tune: DistilBERT base, uncased.
# Other text-classification models: https://huggingface.co/models?filter=text-classification
MODEL_NAME = "distilbert-base-uncased"
# Per-device batch size, used for both training and evaluation in TrainingArguments.
BATCH_SIZE = 16
EPOCHS = 3
LEARNING_RATE= 6.5e-05
WEIGHT_DECAY = 0.289
# NOTE(review): WARMUP_STEPS is not referenced by any code visible in this part of the notebook.
WARMUP_STEPS = 464
RANDOM_SEED=22

# Multiplicative per-layer factor intended for layer-wise learning-rate decay (LLRD).
LEARNING_RATE_DECAY_MULTIPLIER = 0.95
# Number of top transformer layers that model_init() re-initialises.
REINIT_LAYERS = 2


# Use the GPU when CUDA is available, otherwise fall back to the CPU.
device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")

In [None]:

class LLRDTrainer(Trainer):
    """Trainer whose optimizer uses layer-wise learning-rate decay (LLRD).

    The parameter groups come from ``get_optimizer_parameters_with_llrd``;
    every group carries its own ``lr``, decayed from the peak learning rate
    by ``LEARNING_RATE_DECAY_MULTIPLIER`` per layer.
    """

    def create_optimizer_and_scheduler(self, num_training_steps: int):
        """Build the LLRD AdamW optimizer and the learning-rate scheduler.

        The peak learning rate and the weight decay are read from
        ``self.args`` rather than from module-level constants: during
        ``hyperparameter_search`` the sampled values are written onto
        ``self.args``, so reading the constants would make every trial train
        with identical optimizer settings.

        :param num_training_steps: total number of optimizer steps, forwarded
            to ``create_scheduler``.
        """
        peak_lr = self.args.learning_rate
        parameters = get_optimizer_parameters_with_llrd(
            self.model, peak_lr, LEARNING_RATE_DECAY_MULTIPLIER
        )
        # Each group overrides ``lr``; the value passed here is only the
        # fallback for groups that do not define their own.
        self.optimizer = AdamW(parameters, lr=peak_lr, weight_decay=self.args.weight_decay)
        self.create_scheduler(num_training_steps=num_training_steps, optimizer=self.optimizer)


def set_seed(seed):
    """Seed every random number generator used in this notebook.

    Seeds PyTorch (CPU and all CUDA devices), NumPy and Python's ``random``
    module, and switches cuDNN to deterministic, non-benchmarking mode.
    Passing ``None`` is a no-op: no generator or cuDNN flag is touched.

    :param seed: integer seed, or None to leave everything unchanged
    """
    if seed is None:
        return

    # PyTorch generators first (CPU, then every CUDA device).
    torch.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)

    # Trade cuDNN autotuning for repeatable kernels.
    cudnn = torch.backends.cudnn
    cudnn.deterministic = True
    cudnn.benchmark = False

    # Remaining generators: NumPy and the standard library.
    np.random.seed(seed)
    random.seed(seed)

def compute_metrics(pred):
    """Compute overall and per-class metrics for a 3-class prediction output.

    :param pred: object exposing ``label_ids`` (true class ids) and
        ``predictions`` (per-class scores; the arg-max over the last axis is
        taken as the predicted class).
    :return: dict with ``accuracy``, macro-averaged ``f1`` / ``precision`` /
        ``recall``, and ``<class>_f1`` / ``<class>_recall`` /
        ``<class>_precision`` for the classes hate (id 0), offensive (id 1)
        and normal (id 2).
    """
    labels = pred.label_ids
    preds = pred.predictions.argmax(-1)

    acc = accuracy_score(labels, preds)
    precision, recall, f1, _ = precision_recall_fscore_support(labels, preds, average='macro')

    # Request all three classes explicitly so the report always has the
    # "0"/"1"/"2" entries, even when a class is absent from both the labels
    # and the predictions (otherwise the lookups below raise KeyError).
    # zero_division=0 keeps the value the default would produce, without the warning.
    report = classification_report(
        labels, preds, labels=[0, 1, 2], digits=4, output_dict=True, zero_division=0
    )

    metrics = {
        'accuracy': acc,
        'f1': f1,
        'precision': precision,
        'recall': recall,
    }
    for class_id, class_name in enumerate(('hate', 'offensive', 'normal')):
        class_report = report[str(class_id)]
        metrics[f'{class_name}_f1'] = class_report["f1-score"]
        metrics[f'{class_name}_recall'] = class_report["recall"]
        metrics[f'{class_name}_precision'] = class_report["precision"]
    return metrics



def timestamp():
    """Print the current local date and time as ``DD-Mon-YYYY (HH:MM:SS.ffffff)``."""
    print(datetime.now().strftime("%d-%b-%Y (%H:%M:%S.%f)"))


def get_optimizer_parameters_with_llrd(model, peak_lr, multiplicative_factor):
    """Build optimizer parameter groups with layer-wise learning-rate decay.

    Groups are returned in this order:

    * ``tsl`` - every parameter whose name does not contain ``distilbert``
      (the task-specific layers); learning rate ``peak_lr``.
    * ``layer_<i>`` - one group per entry of ``model.distilbert.transformer.layer``.
      The last encoder layer gets ``peak_lr * multiplicative_factor`` and each
      earlier layer is multiplied by ``multiplicative_factor`` once more.
    * ``embedding`` - parameters whose name contains ``embeddings``; one more
      decay step below the first encoder layer.

    :param model: module exposing ``named_parameters()`` and
        ``distilbert.transformer.layer``.
    :param peak_lr: learning rate of the task-specific layers.
    :param multiplicative_factor: per-layer decay factor.
    :return: list of dicts with keys ``params``, ``param_names``, ``lr`` and ``name``.
    """
    # Walk the parameters once instead of once per group.
    named_params = list(model.named_parameters())
    num_encoder_layers = len(model.distilbert.transformer.layer)

    def _make_group(group_name, lr, belongs):
        # Collect the (name, parameter) pairs accepted by the predicate.
        selected = [(name, param) for name, param in named_params if belongs(name)]
        return {
            "params": [param for _, param in selected],
            "param_names": [name for name, _ in selected],
            "lr": lr,
            "name": group_name,
        }

    # Task specific layer gets the peak_lr
    tsl_parameters = [_make_group("tsl", peak_lr, lambda name: 'distilbert' not in name)]

    # Starting from the last encoder layer each encoder layer gets
    # current_layer_lr = prev_layer_lr * multiplicative_factor,
    # with the last encoder layer at peak_lr * multiplicative_factor.
    encoder_parameters = []
    for layer_num in range(num_encoder_layers):
        # The trailing dot stops "layer.1" from also matching "layer.10",
        # "layer.11", ... which would place parameters in several groups.
        prefix = f"distilbert.transformer.layer.{layer_num}."
        encoder_parameters.append(
            _make_group(
                f"layer_{layer_num}",
                peak_lr * (multiplicative_factor ** (num_encoder_layers - layer_num)),
                lambda name, prefix=prefix: prefix in name,
            )
        )

    # Embedding layer lr = first encoder layer lr * multiplicative_factor
    embedding_parameters = [
        _make_group(
            "embedding",
            peak_lr * (multiplicative_factor ** (num_encoder_layers + 1)),
            lambda name: 'embeddings' in name,
        )
    ]
    return tsl_parameters + encoder_parameters + embedding_parameters


def reinit_autoencoder_model(model, reinit_num_layers=0):
    """Re-initialise the last ``reinit_num_layers`` transformer layers in place.

    Within each selected layer, ``nn.Linear`` weights (and trainable
    ``nn.Embedding`` weights) are redrawn from a normal distribution with
    mean 0 and std ``model.config.initializer_range``, ``nn.Linear`` biases
    are zeroed, and ``nn.LayerNorm`` is reset to weight 1 / bias 0.

    :param model: model exposing ``distilbert.transformer.layer`` and ``config``
    :param reinit_num_layers: how many layers, counted from the top, to reset;
        a falsy value leaves the model untouched
    :return: the same model object
    """
    if not reinit_num_layers:
        return model

    def _redraw(tensor):
        # Same distribution for every re-drawn weight matrix.
        tensor.data.normal_(mean=0.0, std=model.config.initializer_range)

    for block in model.distilbert.transformer.layer[-reinit_num_layers:]:
        for submodule in block.modules():
            if isinstance(submodule, nn.Linear):
                _redraw(submodule.weight)
                if submodule.bias is not None:
                    submodule.bias.data.zero_()
            elif isinstance(submodule, nn.LayerNorm):
                submodule.bias.data.zero_()
                submodule.weight.data.fill_(1.0)
            elif isinstance(submodule, nn.Embedding):
                if submodule.weight.requires_grad:
                    _redraw(submodule.weight)

    return model


def model_init():
    """Create a fresh 3-label classifier for the Trainer.

    Loads ``MODEL_NAME`` with a 3-class sequence-classification head, moves it
    to ``device`` and re-initialises its top ``REINIT_LAYERS`` transformer layers.

    :return: the prepared model
    """
    pretrained = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME, num_labels=3)
    on_device = pretrained.to(device)
    return reinit_autoencoder_model(on_device, REINIT_LAYERS)



In [None]:
# Seed the PyTorch, NumPy and Python RNGs (and put cuDNN in deterministic mode)
# before any data or model is created.
set_seed(RANDOM_SEED)

In [None]:
# Load the dataset previously saved to disk; its 'train' and 'validation'
# splits are the ones handed to the trainer below.
# NOTE(review): the path is an absolute Colab/Drive location - it presumably requires Drive to be mounted first.
dataset_dfs = load_from_disk('/content/drive/MyDrive/Dissertation/datasets/hatetwit_'+str(1))

In [None]:
# Baseline training configuration; hyperparameter_search overrides the
# searched fields (learning rate, warmup, weight decay, batch size) per trial.
training_args = TrainingArguments(
    output_dir='/content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results',          # output directory
    num_train_epochs=EPOCHS,              # total number of training epochs
    save_strategy ="epoch" ,              # checkpoint once per epoch (must match evaluation_strategy)
    per_device_train_batch_size=BATCH_SIZE,  # batch size per device during training
    per_device_eval_batch_size=BATCH_SIZE,   # batch size for evaluation
    weight_decay= WEIGHT_DECAY,               # strength of weight decay
    learning_rate= LEARNING_RATE,             # peak learning rate
    logging_dir='./disbert_hate_optimal/hyper/logs',     # directory for storing logs
    load_best_model_at_end=True,     # load the best model when finished training (default metric is loss)
    evaluation_strategy="epoch",     # evaluate at the end of every epoch
    # The Trainer seeds the RNGs itself from this value (default 42) before
    # building the model, so RANDOM_SEED must be passed here to take effect.
    seed=RANDOM_SEED,
)

In [None]:
# Trainer used for the hyperparameter search; it receives a model factory
# (model_init) instead of a model instance.
hyper_trainer = LLRDTrainer(
    model_init=model_init,                         # factory returning a freshly initialised model
    args=training_args,                  # training arguments, defined above
    train_dataset=dataset_dfs['train'],         # training dataset
    eval_dataset=dataset_dfs['validation'],          # evaluation dataset
    compute_metrics=compute_metrics     # the callback that computes metrics of interest
)

https://huggingface.co/distilbert-base-uncased/resolve/main/config.json not found in cache or force_download set to True, downloading to /root/.cache/huggingface/transformers/tmpbl6biisv


Downloading:   0%|          | 0.00/483 [00:00<?, ?B/s]

storing https://huggingface.co/distilbert-base-uncased/resolve/main/config.json in cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
creating metadata file for /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "

Downloading:   0%|          | 0.00/256M [00:00<?, ?B/s]

storing https://huggingface.co/distilbert-base-uncased/resolve/main/pytorch_model.bin in cache at /root/.cache/huggingface/transformers/9c169103d7e5a73936dd2b627e42851bec0831212b677c637033ee4bce9ab5ee.126183e36667471617ae2f0835fab707baa54b731f991507ebbb55ea85adb12a
creating metadata file for /root/.cache/huggingface/transformers/9c169103d7e5a73936dd2b627e42851bec0831212b677c637033ee4bce9ab5ee.126183e36667471617ae2f0835fab707baa54b731f991507ebbb55ea85adb12a
loading weights file https://huggingface.co/distilbert-base-uncased/resolve/main/pytorch_model.bin from cache at /root/.cache/huggingface/transformers/9c169103d7e5a73936dd2b627e42851bec0831212b677c637033ee4bce9ab5ee.126183e36667471617ae2f0835fab707baa54b731f991507ebbb55ea85adb12a
Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_projector.bia

In [None]:
def hp_space_optuna(trial) :
    """Sample one hyperparameter configuration from the search space.

    :param trial: trial object providing ``suggest_categorical``,
        ``suggest_int`` and ``suggest_float``
    :return: dict with the sampled ``learning_rate``, ``warmup_steps``,
        ``weight_decay`` and ``per_device_train_batch_size``
    """
    space = {}
    # Discrete grid of peak learning rates.
    space["learning_rate"] = trial.suggest_categorical("learning_rate", [1.5e-5, 3.5e-5, 6.5e-5, 10.5e-5])
    # Integer number of warmup steps between 0 and 500.
    space["warmup_steps"] = trial.suggest_int("warmup_steps", 0, 500)
    # Continuous weight decay between 0.1 and 0.3.
    space["weight_decay"] = trial.suggest_float("weight_decay", 0.1 , 0.3)
    # Discrete set of per-device training batch sizes.
    space["per_device_train_batch_size"] = trial.suggest_categorical("per_device_train_batch_size", [ 16,32,64,128])
    return space

In [None]:
# Run 40 Optuna trials over hp_space_optuna and keep the trial with the highest objective.
# NOTE(review): no compute_objective is passed, so the Trainer's default objective is used -
# TODO confirm it is the metric you actually want to maximise (e.g. macro F1).
best_trial = hyper_trainer.hyperparameter_search(n_trials=40, direction="maximize", backend="optuna", hp_space=hp_space_optuna)

[32m[I 2022-02-15 21:45:35,004][0m A new study created in memory with name: no-name-eea1c617-842a-447d-b9cc-8ead97c2bd1f[0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "max_position_embeddings": 512,
  "model_type": "distilbert",
  "n_heads": 12,
  "n_layers": 6,
  "pad_token_id": 0,
  "qa_dropout": 0.1,
  "seq_classif_dropout":

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5823,0.550534,0.775703,0.721651,0.735487,0.711784,0.712902,0.703219,0.722854,0.853973,0.883377,0.826463,0.598078,0.548755,0.657143
2,0.4555,0.494986,0.799528,0.761102,0.754913,0.768329,0.764621,0.795775,0.735814,0.867761,0.851536,0.884615,0.650924,0.657676,0.644309
3,0.3152,0.520046,0.808113,0.767489,0.764824,0.771924,0.777247,0.817907,0.740437,0.875327,0.868197,0.882574,0.649893,0.629668,0.67146


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-0/checkpoint-1165
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-0/checkpoint-1165/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-0/checkpoint-1165/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving mode

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5769,0.539596,0.773127,0.712312,0.735958,0.697009,0.706191,0.677062,0.737939,0.854986,0.901518,0.813022,0.575758,0.512448,0.656915
2,0.4435,0.495122,0.804464,0.765329,0.759079,0.773415,0.769596,0.814889,0.729073,0.872947,0.855979,0.890601,0.653445,0.649378,0.657563
3,0.2856,0.551783,0.810045,0.766844,0.766532,0.768619,0.784124,0.814889,0.755597,0.879259,0.878934,0.879585,0.637149,0.612033,0.664414


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-1/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-1/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-1/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving mode

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,No log,0.582558,0.751449,0.710902,0.711135,0.729222,0.685239,0.828974,0.583983,0.828365,0.787116,0.874178,0.619101,0.571577,0.675245
2,0.607100,0.523493,0.786435,0.733673,0.755842,0.717739,0.720213,0.681087,0.764108,0.860116,0.902629,0.821429,0.62069,0.569502,0.681988
3,0.607100,0.509643,0.794591,0.749243,0.750268,0.751683,0.751303,0.797787,0.709937,0.866938,0.865976,0.867904,0.629486,0.591286,0.672963


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-2/checkpoint-292
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-2/checkpoint-292/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-2/checkpoint-292/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model c

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5694,0.530946,0.777205,0.726461,0.73277,0.72181,0.714571,0.720322,0.708911,0.855687,0.870418,0.841446,0.609126,0.574689,0.647953
2,0.4377,0.512852,0.801889,0.76134,0.75641,0.767102,0.758354,0.787726,0.731092,0.872816,0.860052,0.885965,0.65285,0.653527,0.652174
3,0.2879,0.559558,0.805967,0.762826,0.763436,0.764644,0.784069,0.821932,0.749541,0.873521,0.874491,0.872553,0.630887,0.59751,0.668213


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-3/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-3/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-3/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving mode

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,No log,0.639283,0.713887,0.681552,0.67934,0.717552,0.65565,0.858149,0.530473,0.791113,0.705294,0.900709,0.597895,0.589212,0.606838
2,0.651900,0.519813,0.787723,0.732738,0.759795,0.714838,0.726405,0.689135,0.767937,0.861345,0.910774,0.817004,0.610465,0.544606,0.694444
3,0.651900,0.498732,0.797381,0.752121,0.752169,0.756095,0.751407,0.805835,0.703866,0.87065,0.865976,0.875374,0.634308,0.596473,0.677267


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-4/checkpoint-292
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-4/checkpoint-292/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-4/checkpoint-292/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model c

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.6542,0.540803,0.77463,0.731069,0.728265,0.739844,0.713312,0.789738,0.650373,0.850388,0.832284,0.869296,0.629508,0.59751,0.665127
2,0.4902,0.487199,0.807684,0.764308,0.768563,0.760539,0.757438,0.755533,0.759353,0.877013,0.887079,0.867173,0.658471,0.639004,0.679162
3,0.3858,0.501863,0.80704,0.764714,0.764654,0.767336,0.772901,0.814889,0.735027,0.874954,0.87301,0.876906,0.646288,0.614108,0.682028


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-5/checkpoint-583
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-5/checkpoint-583/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-5/checkpoint-583/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model c

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5725,0.528405,0.782571,0.726071,0.745688,0.711769,0.71474,0.678068,0.755605,0.86235,0.902258,0.825822,0.601124,0.554979,0.655637
2,0.4333,0.500386,0.803391,0.762776,0.757168,0.769397,0.767375,0.799799,0.737477,0.874623,0.860052,0.889697,0.646329,0.64834,0.64433
3,0.2813,0.544801,0.813694,0.772989,0.76952,0.777357,0.787028,0.817907,0.758396,0.882122,0.874121,0.890271,0.649816,0.640041,0.659893


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-6/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-6/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-6/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving mode

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,No log,0.64994,0.711097,0.679794,0.678772,0.718129,0.650474,0.862173,0.522243,0.78943,0.696779,0.910498,0.599478,0.595436,0.603575


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 22:20:51,327][0m Trial 7 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.687,0.541179,0.777849,0.732695,0.733506,0.735296,0.716376,0.763581,0.674667,0.8521,0.848945,0.855278,0.629609,0.593361,0.670574
2,0.5022,0.489274,0.805323,0.763162,0.76469,0.761679,0.753535,0.750503,0.756592,0.875207,0.878934,0.871512,0.660742,0.655602,0.665964
3,0.3928,0.501783,0.805967,0.762584,0.762141,0.765829,0.769596,0.814889,0.729073,0.875883,0.87264,0.87915,0.642272,0.609959,0.678201


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-8/checkpoint-583
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-8/checkpoint-583/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-8/checkpoint-583/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model c

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5742,0.520922,0.78064,0.725796,0.741303,0.715174,0.72412,0.714286,0.73423,0.858519,0.890781,0.828512,0.594749,0.540456,0.661168
2,0.435,0.501118,0.804679,0.765728,0.757837,0.776082,0.774741,0.826962,0.728723,0.874074,0.851907,0.897426,0.648369,0.649378,0.647363
3,0.2807,0.55793,0.804894,0.761461,0.758638,0.765657,0.778846,0.814889,0.745856,0.876539,0.870048,0.883127,0.628998,0.612033,0.64693


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-9/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-9/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-9/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving mode

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5767,0.545714,0.774844,0.722212,0.736264,0.712583,0.711538,0.707243,0.715886,0.851003,0.879674,0.824142,0.604096,0.55083,0.668766


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 22:31:47,756][0m Trial 10 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.577,0.545823,0.775488,0.725314,0.733727,0.720093,0.712383,0.726358,0.698935,0.851543,0.868567,0.835173,0.612016,0.565353,0.667075
2,0.4501,0.487436,0.803606,0.763968,0.760295,0.767929,0.767029,0.78169,0.752907,0.872591,0.863384,0.881997,0.652286,0.658714,0.645982
3,0.3095,0.523021,0.801674,0.757195,0.756946,0.75941,0.774038,0.809859,0.741252,0.872545,0.871899,0.873192,0.625,0.596473,0.656393


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-11/checkpoint-1165
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-11/checkpoint-1165/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-11/checkpoint-1165/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving m

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5873,0.552536,0.772698,0.719295,0.731891,0.709545,0.705882,0.688129,0.724576,0.85156,0.879304,0.825513,0.600444,0.561203,0.645585


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 22:37:43,510][0m Trial 12 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5706,0.535501,0.77742,0.719692,0.740108,0.7051,0.707317,0.671026,0.747758,0.858202,0.899667,0.820392,0.593556,0.544606,0.652174


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 22:39:31,657][0m Trial 13 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5798,0.545827,0.777849,0.725554,0.738168,0.716524,0.713634,0.708249,0.719101,0.854578,0.881155,0.829557,0.608451,0.560166,0.665845
2,0.4528,0.494306,0.805323,0.76601,0.761924,0.77074,0.772374,0.798793,0.747646,0.87287,0.863014,0.882955,0.652785,0.650415,0.655172
3,0.312,0.521457,0.80983,0.768092,0.767246,0.770667,0.784408,0.81992,0.751845,0.876972,0.874861,0.879092,0.642896,0.61722,0.6708


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-14/checkpoint-1165
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-14/checkpoint-1165/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-14/checkpoint-1165/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving m

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5682,0.525638,0.779996,0.725719,0.739332,0.715586,0.718397,0.703219,0.734244,0.858984,0.88856,0.831313,0.599776,0.554979,0.652439
2,0.4346,0.500007,0.81026,0.770456,0.765179,0.777765,0.776303,0.823944,0.733871,0.8786,0.864124,0.893568,0.656464,0.645228,0.668099
3,0.2823,0.548974,0.807899,0.763814,0.761962,0.767301,0.78616,0.822938,0.75253,0.879137,0.875231,0.883078,0.626143,0.603734,0.650279


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-15/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-15/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-15/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving m

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5792,0.552108,0.774844,0.724039,0.732822,0.71859,0.715415,0.72837,0.702913,0.851187,0.869308,0.833807,0.605515,0.558091,0.661747


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 22:51:35,471][0m Trial 16 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.6608,0.539308,0.778708,0.733786,0.734179,0.740421,0.71208,0.788732,0.649007,0.854942,0.842281,0.867989,0.634337,0.590249,0.685542
2,0.4918,0.488721,0.805108,0.762797,0.765912,0.75985,0.750635,0.743461,0.757949,0.874243,0.881525,0.867079,0.663512,0.654564,0.672708


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-17/checkpoint-583
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-17/checkpoint-583/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-17/checkpoint-583/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 202

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5714,0.528563,0.779566,0.719631,0.744569,0.704697,0.718637,0.700201,0.73807,0.858999,0.905591,0.816967,0.581257,0.508299,0.67867


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 22:56:00,455][0m Trial 18 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.58,0.541411,0.779996,0.729965,0.739507,0.72315,0.721805,0.724346,0.719281,0.855025,0.875602,0.835394,0.613065,0.569502,0.663845
2,0.4532,0.488538,0.804464,0.765035,0.75999,0.770723,0.771331,0.795775,0.748344,0.873568,0.860792,0.886728,0.650206,0.655602,0.644898
3,0.3117,0.517651,0.805752,0.763401,0.761211,0.767262,0.776606,0.814889,0.741758,0.875186,0.869678,0.880765,0.638412,0.61722,0.661111


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-19/checkpoint-1165
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-19/checkpoint-1165/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-19/checkpoint-1165/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving m

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5874,0.554778,0.773557,0.718508,0.736346,0.705696,0.701718,0.678068,0.727077,0.851766,0.88819,0.818213,0.602041,0.55083,0.66375


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:02:00,834][0m Trial 20 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5886,0.546789,0.779996,0.723707,0.744099,0.709346,0.713235,0.683099,0.746154,0.858456,0.899297,0.821163,0.59943,0.545643,0.664981


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:03:26,935][0m Trial 21 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5786,0.549758,0.773127,0.720486,0.731884,0.711859,0.713265,0.703219,0.723602,0.85098,0.876342,0.827044,0.597214,0.556017,0.645006


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:04:53,441][0m Trial 22 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5814,0.547989,0.775274,0.723859,0.732243,0.717148,0.704211,0.698189,0.710338,0.854091,0.87338,0.835636,0.613275,0.579876,0.650757


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:06:19,815][0m Trial 23 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.577,0.5397,0.781713,0.730512,0.741796,0.72208,0.713996,0.708249,0.719836,0.85812,0.882266,0.835261,0.61942,0.575726,0.67029
2,0.4468,0.486918,0.802533,0.763567,0.757745,0.77029,0.765875,0.794769,0.739008,0.871515,0.85635,0.887227,0.653313,0.659751,0.646999


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-24/checkpoint-1165
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-24/checkpoint-1165/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-24/checkpoint-1165/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5721,0.529675,0.784718,0.730362,0.747095,0.718864,0.725691,0.71328,0.738542,0.861621,0.895594,0.83013,0.603774,0.547718,0.672611
2,0.4363,0.492741,0.802962,0.763443,0.757698,0.770411,0.770413,0.806841,0.737132,0.87194,0.85709,0.887313,0.647975,0.647303,0.648649


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-25/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-25/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-25/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.6774,0.546878,0.771625,0.724316,0.728131,0.728044,0.705451,0.774648,0.647603,0.84853,0.844132,0.852974,0.618966,0.565353,0.683814


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:14:23,655][0m Trial 26 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,No log,0.652525,0.710882,0.680343,0.678897,0.718906,0.650703,0.861167,0.522908,0.787828,0.694928,0.909399,0.602497,0.600622,0.604384


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:15:34,808][0m Trial 27 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5849,0.551004,0.779996,0.725588,0.741655,0.714676,0.713849,0.705231,0.72268,0.857653,0.890041,0.827539,0.605263,0.548755,0.674745
2,0.4569,0.489462,0.802747,0.761717,0.758362,0.766125,0.767969,0.800805,0.73772,0.871987,0.863754,0.880377,0.645195,0.633817,0.656989


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-28/checkpoint-1165
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-28/checkpoint-1165/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-28/checkpoint-1165/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5741,0.534459,0.772269,0.710741,0.735427,0.694278,0.696905,0.656942,0.742045,0.855491,0.90411,0.811835,0.579827,0.521784,0.652399


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:20:17,041][0m Trial 29 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5702,0.525938,0.781713,0.725878,0.74302,0.713957,0.713992,0.698189,0.730526,0.860904,0.895964,0.828483,0.60274,0.547718,0.670051
2,0.4346,0.50603,0.802747,0.763093,0.757319,0.770489,0.766444,0.808853,0.728261,0.871843,0.85635,0.887908,0.650993,0.646266,0.655789


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-30/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-30/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-30/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5741,0.534459,0.772269,0.710741,0.735427,0.694278,0.696905,0.656942,0.742045,0.855491,0.90411,0.811835,0.579827,0.521784,0.652399


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:25:43,988][0m Trial 31 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5748,0.542062,0.779566,0.718912,0.750597,0.699239,0.714286,0.669014,0.766129,0.858035,0.915217,0.807579,0.584416,0.513485,0.678082


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:27:32,627][0m Trial 32 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,No log,0.584149,0.752522,0.71035,0.717044,0.72855,0.684575,0.846076,0.574846,0.830644,0.790818,0.874693,0.615832,0.548755,0.701592


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:28:43,574][0m Trial 33 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5759,0.527172,0.778493,0.724509,0.736172,0.715994,0.715736,0.709256,0.722336,0.858016,0.883747,0.833741,0.599776,0.554979,0.652439


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:30:31,983][0m Trial 34 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5767,0.534817,0.780854,0.720808,0.746293,0.7041,0.715421,0.679074,0.755879,0.861296,0.910404,0.817215,0.585706,0.522822,0.665786


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:32:20,143][0m Trial 35 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,No log,0.5707,0.757029,0.717486,0.715435,0.734738,0.690355,0.820926,0.59562,0.83233,0.79304,0.875715,0.629773,0.590249,0.67497


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:33:30,927][0m Trial 36 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.6935,0.540339,0.778279,0.731107,0.733901,0.73105,0.712092,0.746479,0.680734,0.854297,0.85746,0.851158,0.626932,0.589212,0.669811
2,0.5045,0.490775,0.802103,0.75693,0.761862,0.752424,0.745918,0.735412,0.756729,0.874475,0.885968,0.863276,0.650398,0.635892,0.665581


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-37/checkpoint-583
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-37/checkpoint-583/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-37/checkpoint-583/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 202

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.5909,0.55535,0.772913,0.714591,0.736859,0.700531,0.708678,0.690141,0.728238,0.851956,0.894854,0.812984,0.583138,0.516598,0.669355


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
[32m[I 2022-02-15 23:37:29,047][0m Trial 38 pruned. [0m
Trial:
loading configuration file https://huggingface.co/distilbert-base-uncased/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/23454919702d26495337f3da04d1655c7ee010d5ec9d77bdb9e399e00302c0a1.91b885ab15d631bf9cee9dc9d25ece0afd932f2f5130eba28f2055b2220c0333
Model config DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForMaskedLM"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall,Hate F1,Hate Recall,Hate Precision,Offensive F1,Offensive Recall,Offensive Precision,Normal F1,Normal Recall,Normal Precision
1,0.571,0.519383,0.786649,0.736433,0.74422,0.73045,0.732763,0.732394,0.733132,0.863101,0.881155,0.845771,0.613436,0.577801,0.653756
2,0.4318,0.507086,0.804679,0.765809,0.758767,0.774588,0.777513,0.820926,0.738462,0.87325,0.854498,0.892843,0.646663,0.64834,0.644995
3,0.2841,0.561989,0.810474,0.768182,0.765854,0.772097,0.787326,0.82495,0.752984,0.879493,0.874121,0.884933,0.637728,0.61722,0.659645


The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving model checkpoint to /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-39/checkpoint-2330
Configuration saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-39/checkpoint-2330/config.json
Model weights saved in /content/drive/MyDrive/Dissertation/disbert_optimal/hyper/results/run-39/checkpoint-2330/pytorch_model.bin
The following columns in the evaluation set  don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: sentence, input_ids_bert, token_type_ids_bert, attention_mask_bert, __index_level_0__.
***** Running Evaluation *****
  Num examples = 4659
  Batch size = 16
Saving m

In [None]:
# Display the selected best run: its run id, objective value, and the
# hyperparameters (learning rate, warmup steps, weight decay, batch size)
# that produced it. Presumably this is the result of the hyperparameter
# search whose trial logs appear above — verify where `best_trial` is assigned.
# NOTE(review): the objective in the saved output (~10.09) is greater than 1,
# so it cannot be a single metric such as F1 or accuracy — presumably it is a
# sum over all reported evaluation metrics; confirm which objective the search
# was configured to optimize before relying on this selection.
best_trial

BestRun(run_id='6', objective=10.093154777381747, hyperparameters={'learning_rate': 3.5e-05, 'warmup_steps': 154, 'weight_decay': 0.18349723349789687, 'per_device_train_batch_size': 16})