In [1]:
#Need to compare the BERT model with the regular SVM model 

In [10]:
from datasets import load_dataset
from transformers import BertTokenizerFast, BertForSequenceClassification
from transformers import Trainer, TrainingArguments
from transformers import DataCollatorWithPadding
import pickle
import os
from sklearn.metrics import classification_report, accuracy_score, f1_score, plot_confusion_matrix,ConfusionMatrixDisplay, confusion_matrix
import pickle
os.environ["WANDB_DISABLED"] = "true"

In [14]:
model_name = "../FinalBERT/Models/Final_model/BERT_13classes_final"
max_length=128

In [15]:
#loading the label encoder
le = pickle.load(open("../FinalBERT/Data/label_encoder.pkl", "rb"))

In [16]:
tokenizer = BertTokenizerFast.from_pretrained(model_name, do_lower_case=True)

In [17]:
target_names=le.transform(le.classes_)

In [18]:
target_names

array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12])

In [23]:
""" Parameters to test"""    
params_combos= {
	  "per_gpu_batch_size": [8, 16, 32],
	  "learning_rate": [2e-5, 3e-5, 5e-5],
	  "num_epochs": [20, 30, 40]
      #"max_length": [32, 128, 256, 512]
	}

    

In [20]:
def preprocess_function(examples):
    #print(examples['TEXT'])
    return tokenizer(examples["text"], padding=True, truncation=True)

    """Uncomment the following to have max length set"""
    #return tokenizer(examples["text"],padding=True,truncation=True, max_length=max_length)
    
    """Uncomment the following to have max length change from the params"""
    #return to tokenizer(examples['text'], padding=True, truncation=True, max_length=params['max_length'][0])

In [24]:
#traying 5 combinations first
import random
params_combos = []
i = 0
while i<10:
    first = random.randint(0,2)
    second = random.randint(0,2)
    third = random.randint(0,2)
    param = {"batch_size": params["per_gpu_batch_size"][first],
             "lr": params["learning_rate"][second],
             "epochs": params["num_epochs"][third]}
    if param not in params_combos:
        params_combos.append(param)
        i+=1

In [25]:
params_combos

[{'batch_size': 32, 'lr': 5e-05, 'epochs': 40},
 {'batch_size': 8, 'lr': 3e-05, 'epochs': 40},
 {'batch_size': 32, 'lr': 3e-05, 'epochs': 30},
 {'batch_size': 16, 'lr': 3e-05, 'epochs': 40},
 {'batch_size': 16, 'lr': 5e-05, 'epochs': 30},
 {'batch_size': 16, 'lr': 3e-05, 'epochs': 30},
 {'batch_size': 16, 'lr': 5e-05, 'epochs': 20},
 {'batch_size': 32, 'lr': 5e-05, 'epochs': 20},
 {'batch_size': 32, 'lr': 5e-05, 'epochs': 30},
 {'batch_size': 8, 'lr': 2e-05, 'epochs': 20}]

In [27]:
def get_prediction(text):
    # prepare our text into tokenized sequence
    inputs = tokenizer(text, padding=True, 
                       truncation=True, 
                       #max_length=max_length,
                       return_tensors="pt").to("cuda")
    
    # perform inference to our model
    outputs = model(**inputs)
    #print(outputs)
    # get output probabilities by doing softmax
    probs = outputs[0].softmax(1)
    #print(outputs[0].softmax(1).argmax())
    # executing argmax function to get the candidate label
    return probs.argmax().item()

## Kfold

In [150]:
#Run kfold over here 
"""
results = []
f1_scores = []
best_model =[]
for i in range(5):
    train_dataset = load_dataset('csv', data_files={'train': 'Data/train.csv'})
    #train_dataset = load_dataset('csv', data_files={'train': 'Data/train2.csv'})
    testing_dataset =load_dataset("csv", data_files={'test':'Data/test.csv'}) 
    #eval_dataset =load_dataset("csv", data_files={'test':'Data/eval.csv'}) 

    #print(train_dataset["train"][0])

    tokenized_dataset_train =train_dataset.map(preprocess_function)
    #print(tokenized_dataset_train['train']['input_ids'])

    tokenized_dataset_test = testing_dataset.map(preprocess_function)
    
    data_collator = DataCollatorWithPadding(tokenizer=tokenizer)
    #dataset has been loaded correctly. 
    print("----------------------MODEL "+ str(i)+"--------------------------------")

    for p in params_combos:
        
        print("Combination: ", p)
        
        model=BertForSequenceClassification.from_pretrained(model_name, num_labels=13)
        #device="cpu"
        device="cuda"
        model.to(device)


        training_args = TrainingArguments(
        num_train_epochs=p["epochs"],
        learning_rate=p["lr"],
        per_device_train_batch_size=p["batch_size"],  # batch size per device during training
        weight_decay=0.01,               # strength of weight decay
        #oad_best_model_at_end=True,
        logging_steps=100,
        #valuation_strategy="steps",
        output_dir="Models/{NAME_OF_OUTPUT_FILE}" #Name of outputs to store checkpoints 
        )

        trainer = Trainer( model=model,
                      args=training_args,
                      train_dataset=tokenized_dataset_train['train'],
                      #eval_dataset=tokenized_dataset_valid['valid'],
                      tokenizer=tokenizer,
                      data_collator=data_collator
                     )


        trainer.train()

        y_pred=[]

        for text in tokenized_dataset_test["test"]["text"]:
            y_pred.append(get_prediction(text))

        predictions = le.inverse_transform(y_pred)
        y_true = tokenized_dataset_test['test']["label"]
        
        f1= f1_score(le.inverse_transform(y_true), predictions, average="macro")
        f1_scores.append(f1)
        
        #Saving the best model 
        if f1 > max(f1_scores):
            best_model = {'split': i, 
                          'params': p,
                          'f1_score': f1,
                          'accuracy': acc}

        acc = accuracy_score(le.inverse_transform(y_true), predictions)
        results.append(acc)
        print(classification_report(le.inverse_transform(y_true), predictions))
        
"""

Using custom data configuration default-39460bdd07acc7bf
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-39460bdd07acc7bf\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Using custom data configuration default-38d3ac2bff9f4eb2
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-38d3ac2bff9f4eb2\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-39460bdd07acc7bf\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-0c03d44608866328.arrow
Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-38d3ac2bff9f4eb2\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-96dbeb40b209ba5f.arrow
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
 

----------------------MODEL 1--------------------------------
Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.5082
200,0.4676
300,0.1954
400,0.122




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LA

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.80      0.89         5
          fa       1.00      1.00      1.00         6
          fe       0.87      1.00      0.93        13
          fp       0.80      0.89      0.84         9
          ft       1.00      0.90      0.95        10
           n       0.86      0.92      0.89        13
         n-d       0.00      0.00      0.00         2
       query       1.00      1.00      1.00         4
         sno       0.89      0.90      0.90        83
          so       0.29      0.40      0.33         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.20      0.33         5

    accuracy                           0.87       166
   macro avg       0.81      0.77      0.77       166
weighted avg       0.88      0.87      0.86       166

Combination:  {'batch_size': 32, 'lr': 3e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4146
200,0.2804
300,0.0705
400,0.0439




Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0"

              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       0.80      0.80      0.80         5
          fa       1.00      1.00      1.00         6
          fe       0.81      1.00      0.90        13
          fp       1.00      0.78      0.88         9
          ft       1.00      0.90      0.95        10
           n       0.80      0.92      0.86        13
         n-d       1.00      0.50      0.67         2
       query       1.00      0.75      0.86         4
         sno       0.91      0.88      0.90        83
          so       0.38      0.60      0.46         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.87       166
   macro avg       0.87      0.83      0.83       166
weighted avg       0.89      0.87      0.88       166

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,2.0421
200,1.2688
300,0.6125
400,0.3545
500,0.2007
600,0.1084
700,0.0852
800,0.0506
900,0.0176
1000,0.0385


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       0.80      0.80      0.80         5
          fa       1.00      1.00      1.00         6
          fe       0.87      1.00      0.93        13
          fp       0.88      0.78      0.82         9
          ft       1.00      1.00      1.00        10
           n       0.92      0.92      0.92        13
         n-d       1.00      0.50      0.67         2
       query       1.00      0.75      0.86         4
         sno       0.92      0.94      0.93        83
          so       0.40      0.40      0.40         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.90       166
   macro avg       0.90      0.82      0.85       166
weighted avg       0.91      0.90      0.90       166

Combination:  {'batch_size': 8, 'lr': 5e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.5166
200,0.637
300,0.3226
400,0.1825
500,0.0848
600,0.0531
700,0.0366
800,0.0358
900,0.0096
1000,0.033


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       0.80      0.80      0.80         5
          fa       1.00      1.00      1.00         6
          fe       0.93      1.00      0.96        13
          fp       0.80      0.89      0.84         9
          ft       1.00      0.90      0.95        10
           n       0.86      0.92      0.89        13
         n-d       0.00      0.00      0.00         2
       query       1.00      1.00      1.00         4
         sno       0.89      0.90      0.90        83
          so       0.00      0.00      0.00         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.87       166
   macro avg       0.78      0.77      0.77       166
weighted avg       0.87      0.87      0.87       166

Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4604
200,0.4173
300,0.1229
400,0.0557
500,0.0404
600,0.0309
700,0.0271
800,0.0264


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       0.80      0.80      0.80         5
          fa       1.00      1.00      1.00         6
          fe       0.79      0.85      0.81        13
          fp       1.00      0.78      0.88         9
          ft       1.00      0.90      0.95        10
           n       0.86      0.92      0.89        13
         n-d       1.00      0.50      0.67         2
       query       1.00      1.00      1.00         4
         sno       0.90      0.93      0.91        83
          so       0.60      0.60      0.60         5
           y       0.89      1.00      0.94         8
         y-d       0.67      0.40      0.50         5

    accuracy                           0.89       166
   macro avg       0.88      0.82      0.84       166
weighted avg       0.89      0.89      0.88       166

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 20}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.664
200,0.6621
300,0.2627
400,0.1341
500,0.0612
600,0.0491
700,0.0388
800,0.0361


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       0.60      1.00      0.75         3
         dno       1.00      0.80      0.89         5
          fa       1.00      1.00      1.00         6
          fe       0.85      0.85      0.85        13
          fp       1.00      0.89      0.94         9
          ft       1.00      1.00      1.00        10
           n       0.86      0.92      0.89        13
         n-d       1.00      0.50      0.67         2
       query       1.00      1.00      1.00         4
         sno       0.91      0.93      0.92        83
          so       0.40      0.40      0.40         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.40      0.57         5

    accuracy                           0.89       166
   macro avg       0.88      0.82      0.83       166
weighted avg       0.90      0.89      0.89       166

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 20}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,2.0433
200,1.2679
300,0.6375
400,0.3595
500,0.2063
600,0.1119
700,0.0931
800,0.0678
900,0.0242
1000,0.0435


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.80      0.89         5
          fa       1.00      1.00      1.00         6
          fe       0.87      1.00      0.93        13
          fp       0.78      0.78      0.78         9
          ft       1.00      1.00      1.00        10
           n       0.80      0.92      0.86        13
         n-d       1.00      0.50      0.67         2
       query       1.00      0.75      0.86         4
         sno       0.89      0.92      0.90        83
          so       0.00      0.00      0.00         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.88       166
   macro avg       0.86      0.79      0.81       166
weighted avg       0.87      0.88      0.87       166

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.1299
200,0.1453
300,0.0343
400,0.0253




Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       0.80      0.80      0.80         5
          fa       1.00      1.00      1.00         6
          fe       0.92      0.92      0.92        13
          fp       0.89      0.89      0.89         9
          ft       1.00      0.90      0.95        10
           n       0.92      0.85      0.88        13
         n-d       0.67      1.00      0.80         2
       query       1.00      0.75      0.86         4
         sno       0.90      0.89      0.90        83
          so       0.25      0.40      0.31         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.87       166
   macro avg       0.85      0.85      0.83       166
weighted avg       0.89      0.87      0.88       166

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 40}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.1244
200,0.133
300,0.0299
400,0.0218
500,0.0199
600,0.0174
700,0.0158
800,0.0161


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       0.80      0.80      0.80         5
          fa       0.86      1.00      0.92         6
          fe       0.86      0.92      0.89        13
          fp       0.88      0.78      0.82         9
          ft       1.00      0.90      0.95        10
           n       0.87      1.00      0.93        13
         n-d       1.00      0.50      0.67         2
       query       1.00      0.75      0.86         4
         sno       0.90      0.89      0.90        83
          so       0.29      0.40      0.33         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.87       166
   macro avg       0.87      0.81      0.83       166
weighted avg       0.88      0.87      0.87       166

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 30}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.6581
200,0.6498
300,0.2435
400,0.117
500,0.0507
600,0.0406
700,0.0308
800,0.0291
900,0.0257
1000,0.024


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


Using custom data configuration default-c94492fa8977105f
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datase

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       0.80      0.80      0.80         5
          fa       1.00      1.00      1.00         6
          fe       0.86      0.92      0.89        13
          fp       1.00      0.78      0.88         9
          ft       1.00      1.00      1.00        10
           n       0.75      0.92      0.83        13
         n-d       0.00      0.00      0.00         2
       query       0.75      0.75      0.75         4
         sno       0.90      0.90      0.90        83
          so       0.33      0.40      0.36         5
           y       0.89      1.00      0.94         8
         y-d       1.00      0.40      0.57         5

    accuracy                           0.87       166
   macro avg       0.79      0.76      0.76       166
weighted avg       0.87      0.87      0.86       166



  0%|          | 0/1 [00:00<?, ?it/s]

Using custom data configuration default-b39b13b3f218eb93
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-b39b13b3f218eb93\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-c94492fa8977105f\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-64e36aca893dd606.arrow
Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-b39b13b3f218eb93\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-ec3292cc75413797.arrow
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
 

----------------------MODEL 1--------------------------------
Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.5015
200,0.4247
300,0.1842
400,0.1166




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LA

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.50      0.50      0.50         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.82      0.90        11
          fp       0.93      0.87      0.90        15
          ft       1.00      1.00      1.00         6
           n       0.90      0.90      0.90        10
         n-d       0.00      0.00      0.00         2
       query       0.71      1.00      0.83         5
         sno       0.86      0.86      0.86        81
          so       0.22      0.33      0.27         6
           y       0.67      1.00      0.80         8
         y-d       1.00      0.40      0.57         5

    accuracy                           0.82       166
   macro avg       0.67      0.66      0.65       166
weighted avg       0.83      0.82      0.82       166

Combination:  {'batch_size': 32, 'lr': 3e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4492
200,0.3137
300,0.0916
400,0.0522




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.60      0.50      0.55         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.91      0.95        11
          fp       0.93      0.87      0.90        15
          ft       1.00      1.00      1.00         6
           n       0.64      0.90      0.75        10
         n-d       0.00      0.00      0.00         2
       query       0.83      1.00      0.91         5
         sno       0.90      0.89      0.89        81
          so       0.57      0.67      0.62         6
           y       0.73      1.00      0.84         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.86       166
   macro avg       0.70      0.71      0.70       166
weighted avg       0.85      0.86      0.85       166

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 40}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.9377
200,1.064
300,0.5475
400,0.2883
500,0.1635
600,0.0994
700,0.0704
800,0.0391
900,0.047
1000,0.0349


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.60      0.50      0.55         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.73      0.84        11
          fp       0.93      0.87      0.90        15
          ft       1.00      1.00      1.00         6
           n       0.69      0.90      0.78        10
         n-d       0.00      0.00      0.00         2
       query       0.83      1.00      0.91         5
         sno       0.87      0.89      0.88        81
          so       0.57      0.67      0.62         6
           y       0.73      1.00      0.84         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.84       166
   macro avg       0.70      0.70      0.69       166
weighted avg       0.84      0.84      0.84       166

Combination:  {'batch_size': 8, 'lr': 5e-05, 'epochs': 40}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.5653
200,0.6855
300,0.3205
400,0.2117
500,0.1228
600,0.071
700,0.0437
800,0.0405
900,0.0442
1000,0.0317


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.67      0.67      0.67         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.73      0.84        11
          fp       1.00      0.87      0.93        15
          ft       1.00      1.00      1.00         6
           n       0.80      0.80      0.80        10
         n-d       0.00      0.00      0.00         2
       query       0.83      1.00      0.91         5
         sno       0.87      0.90      0.88        81
          so       0.60      0.50      0.55         6
           y       0.73      1.00      0.84         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.84       166
   macro avg       0.72      0.69      0.70       166
weighted avg       0.86      0.84      0.84       166

Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4704
200,0.4072
300,0.1261
400,0.0606
500,0.045
600,0.0352
700,0.0324
800,0.0272


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
 

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.50      0.50      0.50         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.91      0.95        11
          fp       0.93      0.93      0.93        15
          ft       1.00      1.00      1.00         6
           n       0.69      0.90      0.78        10
         n-d       0.00      0.00      0.00         2
       query       0.83      1.00      0.91         5
         sno       0.92      0.89      0.91        81
          so       0.50      0.50      0.50         6
           y       0.73      1.00      0.84         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.86       166
   macro avg       0.69      0.70      0.69       166
weighted avg       0.86      0.86      0.85       166

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.6858
200,0.6962
300,0.2951
400,0.1541
500,0.0867
600,0.0593
700,0.0483
800,0.0439


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.60      0.50      0.55         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.73      0.84        11
          fp       0.88      0.93      0.90        15
          ft       1.00      1.00      1.00         6
           n       0.82      0.90      0.86        10
         n-d       0.00      0.00      0.00         2
       query       0.83      1.00      0.91         5
         sno       0.91      0.93      0.92        81
          so       0.38      0.50      0.43         6
           y       0.80      1.00      0.89         8
         y-d       1.00      0.80      0.89         5

    accuracy                           0.87       166
   macro avg       0.70      0.71      0.70       166
weighted avg       0.86      0.87      0.86       166

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.932
200,1.0219
300,0.5229
400,0.2929
500,0.163
600,0.0998
700,0.0767
800,0.04
900,0.0448
1000,0.0371


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.60      0.50      0.55         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.73      0.84        11
          fp       1.00      0.87      0.93        15
          ft       1.00      1.00      1.00         6
           n       0.69      0.90      0.78        10
         n-d       0.00      0.00      0.00         2
       query       0.71      1.00      0.83         5
         sno       0.87      0.88      0.87        81
          so       0.57      0.67      0.62         6
           y       0.67      1.00      0.80         8
         y-d       1.00      0.40      0.57         5

    accuracy                           0.83       166
   macro avg       0.69      0.68      0.67       166
weighted avg       0.84      0.83      0.83       166

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.1917
200,0.166
300,0.0464
400,0.0303




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.60      0.50      0.55         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.82      0.90        11
          fp       1.00      0.87      0.93        15
          ft       1.00      1.00      1.00         6
           n       0.64      0.90      0.75        10
         n-d       0.00      0.00      0.00         2
       query       0.62      1.00      0.77         5
         sno       0.92      0.88      0.90        81
          so       0.44      0.67      0.53         6
           y       0.73      1.00      0.84         8
         y-d       1.00      0.60      0.75         5

    accuracy                           0.84       166
   macro avg       0.68      0.70      0.68       166
weighted avg       0.86      0.84      0.84       166

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.1739
200,0.1394
300,0.0494
400,0.0288
500,0.0238
600,0.0196
700,0.018
800,0.0159


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"

              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.67      0.67      0.67         6
          fa       0.90      0.90      0.90        10
          fe       0.90      0.82      0.86        11
          fp       1.00      0.87      0.93        15
          ft       1.00      1.00      1.00         6
           n       0.69      0.90      0.78        10
         n-d       0.00      0.00      0.00         2
       query       0.83      1.00      0.91         5
         sno       0.88      0.89      0.88        81
          so       0.60      0.50      0.55         6
           y       0.89      1.00      0.94         8
         y-d       1.00      1.00      1.00         5

    accuracy                           0.86       166
   macro avg       0.72      0.73      0.72       166
weighted avg       0.85      0.86      0.86       166

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 30}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.6797
200,0.677
300,0.2731
400,0.1336
500,0.0715
600,0.0461
700,0.0401
800,0.0369
900,0.0311
1000,0.0282


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       0.00      0.00      0.00         1
         dno       0.50      0.50      0.50         6
          fa       0.90      0.90      0.90        10
          fe       1.00      0.73      0.84        11
          fp       0.93      0.93      0.93        15
          ft       1.00      1.00      1.00         6
           n       0.82      0.90      0.86        10
         n-d       0.00      0.00      0.00         2
       query       0.71      1.00      0.83         5
         sno       0.92      0.88      0.90        81
          so       0.30      0.50      0.37         6
           y       0.80      1.00      0.89         8
         y-d       1.00      0.80      0.89         5

    accuracy                           0.84       166
   macro avg       0.68      0.70      0.69       166
weighted avg       0.86      0.84      0.85       166



Using custom data configuration default-98ddc8d7580f8bc3
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-98ddc8d7580f8bc3\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Using custom data configuration default-b99673641499d8f3
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-b99673641499d8f3\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-98ddc8d7580f8bc3\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-4c0b0d8e8ad7522e.arrow
Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-b99673641499d8f3\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-49089b73dceb9b21.arrow
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
 

----------------------MODEL 1--------------------------------
Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.5251
200,0.489
300,0.2305
400,0.1464




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LA

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       0.85      0.79      0.81        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.91      0.95        11
          fp       0.85      0.85      0.85        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.78      0.88         9
         n-d       0.00      0.00      0.00         1
       query       1.00      0.86      0.92         7
         sno       0.90      0.99      0.94        73
          so       1.00      0.50      0.67         4
           y       1.00      0.80      0.89        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.91       165
   macro avg       0.82      0.80      0.79       165
weighted avg       0.91      0.91      0.90       165

Combination:  {'batch_size': 32, 'lr': 3e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.3736
200,0.2694
300,0.087
400,0.0509




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       1.00      0.79      0.88        14
          fa       1.00      0.92      0.96        12
          fe       1.00      0.91      0.95        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.89      0.94         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.88      0.99      0.93        73
          so       0.50      0.50      0.50         4
           y       1.00      0.70      0.82        10
         y-d       0.50      0.50      0.50         2

    accuracy                           0.90       165
   macro avg       0.77      0.76      0.76       165
weighted avg       0.90      0.90      0.89       165

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 40}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.992
200,1.0727
300,0.61
400,0.3379
500,0.2059
600,0.1275
700,0.0791
800,0.0649
900,0.0556
1000,0.0402


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       0.92      0.79      0.85        14
          fa       1.00      1.00      1.00        12
          fe       1.00      1.00      1.00        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.89      0.94         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.91      0.95      0.93        73
          so       0.29      0.50      0.36         4
           y       1.00      0.70      0.82        10
         y-d       0.50      0.50      0.50         2

    accuracy                           0.89       165
   macro avg       0.75      0.77      0.75       165
weighted avg       0.90      0.89      0.89       165

Combination:  {'batch_size': 8, 'lr': 5e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.5571
200,0.6198
300,0.3462
400,0.187
500,0.102
600,0.0634
700,0.052
800,0.0499
900,0.0539
1000,0.0319


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       1.00      0.79      0.88        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.91      0.95        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.78      0.88         9
         n-d       1.00      1.00      1.00         1
       query       0.86      0.86      0.86         7
         sno       0.90      0.99      0.94        73
          so       1.00      0.50      0.67         4
           y       0.89      0.80      0.84        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.92       165
   macro avg       0.89      0.88      0.87       165
weighted avg       0.92      0.92      0.91       165

Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.5094
200,0.4575
300,0.1478
400,0.0685
500,0.0487
600,0.0388
700,0.0375
800,0.0368


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"

              precision    recall  f1-score   support

         ack       0.33      1.00      0.50         1
         dno       1.00      0.86      0.92        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.91      0.95        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.78      0.88         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.90      1.00      0.95        73
          so       1.00      0.50      0.67         4
           y       1.00      0.70      0.82        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.92       165
   macro avg       0.81      0.80      0.78       165
weighted avg       0.92      0.92      0.91       165

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.6663
200,0.7683
300,0.3307
400,0.1665
500,0.0934
600,0.0614
700,0.0508
800,0.0489


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
 

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       0.92      0.79      0.85        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.91      0.95        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.78      0.88         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.90      0.99      0.94        73
          so       1.00      0.50      0.67         4
           y       1.00      0.80      0.89        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.91       165
   macro avg       0.82      0.80      0.79       165
weighted avg       0.92      0.91      0.91       165

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.9954
200,1.09
300,0.6121
400,0.3525
500,0.2217
600,0.1396
700,0.0967
800,0.0758
900,0.062
1000,0.0441


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       0.92      0.79      0.85        14
          fa       1.00      0.92      0.96        12
          fe       1.00      0.91      0.95        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.78      0.88         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.89      0.96      0.92        73
          so       0.40      0.50      0.44         4
           y       1.00      0.80      0.89        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.89       165
   macro avg       0.77      0.80      0.77       165
weighted avg       0.90      0.89      0.89       165

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.3373
200,0.1785
300,0.0526
400,0.032




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LA

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         1
         dno       1.00      0.79      0.88        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.91      0.95        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.89      0.94         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.90      0.95      0.92        73
          so       0.25      0.50      0.33         4
           y       1.00      0.70      0.82        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.89       165
   macro avg       0.81      0.80      0.79       165
weighted avg       0.91      0.89      0.89       165

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.3374
200,0.1565
300,0.0586
400,0.032
500,0.0295
600,0.0217
700,0.0227
800,0.0232


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       1.00      0.86      0.92        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.82      0.90        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       0.88      0.78      0.82         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.89      0.97      0.93        73
          so       0.67      0.50      0.57         4
           y       1.00      0.70      0.82        10
         y-d       0.50      1.00      0.67         2

    accuracy                           0.90       165
   macro avg       0.78      0.79      0.77       165
weighted avg       0.90      0.90      0.89       165

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 30}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.6637
200,0.759
300,0.3067
400,0.1403
500,0.0779
600,0.0504
700,0.0422
800,0.0425
900,0.0368
1000,0.0371


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf

              precision    recall  f1-score   support

         ack       0.50      1.00      0.67         1
         dno       1.00      0.86      0.92        14
          fa       1.00      1.00      1.00        12
          fe       1.00      0.82      0.90        11
          fp       0.92      0.85      0.88        13
          ft       0.89      1.00      0.94         8
           n       1.00      0.78      0.88         9
         n-d       0.00      0.00      0.00         1
       query       0.86      0.86      0.86         7
         sno       0.89      1.00      0.94        73
          so       0.67      0.50      0.57         4
           y       1.00      0.70      0.82        10
         y-d       0.67      1.00      0.80         2

    accuracy                           0.91       165
   macro avg       0.80      0.80      0.78       165
weighted avg       0.91      0.91      0.90       165



Using custom data configuration default-bbdf4ddd915aa9c5
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-bbdf4ddd915aa9c5\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Using custom data configuration default-9bb1bee6ba541638
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-9bb1bee6ba541638\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-bbdf4ddd915aa9c5\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-f2e42b6cc0805d1e.arrow
Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-9bb1bee6ba541638\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-c26567e1cc560e28.arrow
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


----------------------MODEL 1--------------------------------
Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 20}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.508
200,0.4253
300,0.1816
400,0.1137




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LA

              precision    recall  f1-score   support

         ack       0.80      0.80      0.80         5
         dno       0.69      1.00      0.82         9
          fa       0.83      1.00      0.91         5
          fe       1.00      0.88      0.93         8
          fp       0.70      0.70      0.70        10
          ft       1.00      1.00      1.00         8
           n       0.70      1.00      0.82         7
         n-d       0.00      0.00      0.00         3
       query       1.00      0.80      0.89        10
         sno       0.90      0.92      0.91        75
          so       0.00      0.00      0.00         7
           y       0.93      0.93      0.93        14
         y-d       0.60      0.75      0.67         4

    accuracy                           0.85       165
   macro avg       0.70      0.75      0.72       165
weighted avg       0.82      0.85      0.83       165

Combination:  {'batch_size': 32, 'lr': 3e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4745
200,0.2984
300,0.0929
400,0.0475




Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       0.80      0.80      0.80         5
         dno       0.69      1.00      0.82         9
          fa       0.83      1.00      0.91         5
          fe       1.00      1.00      1.00         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.64      1.00      0.78         7
         n-d       0.00      0.00      0.00         3
       query       1.00      0.80      0.89        10
         sno       0.93      0.88      0.90        75
          so       0.00      0.00      0.00         7
           y       1.00      0.93      0.96        14
         y-d       0.80      1.00      0.89         4

    accuracy                           0.85       165
   macro avg       0.72      0.79      0.75       165
weighted avg       0.84      0.85      0.84       165

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.9175
200,0.8789
300,0.4565
400,0.2341
500,0.1299
600,0.0825
700,0.0355
800,0.0439
900,0.0332
1000,0.0335


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.80      0.80      0.80         5
         dno       0.73      0.89      0.80         9
          fa       1.00      1.00      1.00         5
          fe       1.00      1.00      1.00         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.70      1.00      0.82         7
         n-d       0.00      0.00      0.00         3
       query       1.00      0.80      0.89        10
         sno       0.90      0.92      0.91        75
          so       0.00      0.00      0.00         7
           y       1.00      0.93      0.96        14
         y-d       0.80      1.00      0.89         4

    accuracy                           0.86       165
   macro avg       0.74      0.78      0.76       165
weighted avg       0.84      0.86      0.85       165

Combination:  {'batch_size': 8, 'lr': 5e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.4842
200,0.5761
300,0.3163
400,0.1769
500,0.0925
600,0.0668
700,0.0153
800,0.0298
900,0.0277
1000,0.0238


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.67      0.80      0.73         5
         dno       0.75      1.00      0.86         9
          fa       1.00      1.00      1.00         5
          fe       1.00      0.88      0.93         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.67      0.86      0.75         7
         n-d       0.33      0.33      0.33         3
       query       1.00      0.90      0.95        10
         sno       0.93      0.91      0.92        75
          so       0.40      0.29      0.33         7
           y       1.00      0.93      0.96        14
         y-d       1.00      1.00      1.00         4

    accuracy                           0.87       165
   macro avg       0.81      0.82      0.81       165
weighted avg       0.88      0.87      0.87       165

Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4171
200,0.377
300,0.1175
400,0.05
500,0.0364
600,0.0336
700,0.0273
800,0.0248


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       0.67      0.80      0.73         5
         dno       0.64      1.00      0.78         9
          fa       1.00      1.00      1.00         5
          fe       1.00      1.00      1.00         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.58      1.00      0.74         7
         n-d       0.00      0.00      0.00         3
       query       1.00      0.80      0.89        10
         sno       0.93      0.88      0.90        75
          so       0.00      0.00      0.00         7
           y       1.00      0.93      0.96        14
         y-d       0.80      1.00      0.89         4

    accuracy                           0.85       165
   macro avg       0.72      0.79      0.74       165
weighted avg       0.84      0.85      0.84       165

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 20}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.6238
200,0.7048
300,0.2802
400,0.1129
500,0.0752
600,0.0515
700,0.0361
800,0.0375


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       0.57      0.80      0.67         5
         dno       0.64      1.00      0.78         9
          fa       1.00      1.00      1.00         5
          fe       1.00      0.88      0.93         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.58      1.00      0.74         7
         n-d       1.00      0.33      0.50         3
       query       1.00      0.90      0.95        10
         sno       0.93      0.87      0.90        75
          so       0.00      0.00      0.00         7
           y       0.80      0.86      0.83        14
         y-d       1.00      0.50      0.67         4

    accuracy                           0.83       165
   macro avg       0.79      0.76      0.75       165
weighted avg       0.84      0.83      0.82       165

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 20}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.9211
200,0.89
300,0.4692
400,0.2508
500,0.1312
600,0.0938
700,0.0414
800,0.0517
900,0.0375
1000,0.0377


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.67      0.80      0.73         5
         dno       0.67      0.89      0.76         9
          fa       1.00      1.00      1.00         5
          fe       1.00      1.00      1.00         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.60      0.86      0.71         7
         n-d       0.00      0.00      0.00         3
       query       1.00      0.80      0.89        10
         sno       0.91      0.92      0.91        75
          so       0.00      0.00      0.00         7
           y       0.93      0.93      0.93        14
         y-d       0.75      0.75      0.75         4

    accuracy                           0.85       165
   macro avg       0.71      0.75      0.73       165
weighted avg       0.82      0.85      0.83       165

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 20}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.2601
200,0.1494
300,0.0387
400,0.0236




Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0"

              precision    recall  f1-score   support

         ack       0.57      0.80      0.67         5
         dno       0.69      1.00      0.82         9
          fa       1.00      1.00      1.00         5
          fe       1.00      1.00      1.00         8
          fp       0.67      0.80      0.73        10
          ft       1.00      1.00      1.00         8
           n       0.70      1.00      0.82         7
         n-d       0.00      0.00      0.00         3
       query       1.00      0.90      0.95        10
         sno       0.94      0.88      0.91        75
          so       0.40      0.29      0.33         7
           y       1.00      0.86      0.92        14
         y-d       0.80      1.00      0.89         4

    accuracy                           0.86       165
   macro avg       0.75      0.81      0.77       165
weighted avg       0.86      0.86      0.86       165

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.1535
200,0.1041
300,0.0343
400,0.0232
500,0.0188
600,0.0188
700,0.0158
800,0.0152


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       0.67      0.80      0.73         5
         dno       0.75      1.00      0.86         9
          fa       0.83      1.00      0.91         5
          fe       1.00      0.88      0.93         8
          fp       0.67      0.80      0.73        10
          ft       1.00      1.00      1.00         8
           n       0.78      1.00      0.88         7
         n-d       0.33      0.33      0.33         3
       query       1.00      0.80      0.89        10
         sno       0.90      0.85      0.88        75
          so       0.20      0.14      0.17         7
           y       0.93      0.93      0.93        14
         y-d       0.75      0.75      0.75         4

    accuracy                           0.84       165
   macro avg       0.75      0.79      0.77       165
weighted avg       0.84      0.84      0.83       165

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 30}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.6171
200,0.6777
300,0.251
400,0.0945
500,0.0623
600,0.0414
700,0.028
800,0.0295
900,0.0292
1000,0.0177


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       0.57      0.80      0.67         5
         dno       0.69      1.00      0.82         9
          fa       0.83      1.00      0.91         5
          fe       1.00      1.00      1.00         8
          fp       0.73      0.80      0.76        10
          ft       1.00      1.00      1.00         8
           n       0.64      1.00      0.78         7
         n-d       1.00      0.33      0.50         3
       query       1.00      0.90      0.95        10
         sno       0.94      0.87      0.90        75
          so       0.00      0.00      0.00         7
           y       0.92      0.86      0.89        14
         y-d       1.00      1.00      1.00         4

    accuracy                           0.85       165
   macro avg       0.79      0.81      0.78       165
weighted avg       0.86      0.85      0.85       165



Using custom data configuration default-aa12508fefee773d
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-aa12508fefee773d\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Using custom data configuration default-22230474c63e2a7d
Reusing dataset csv (C:\Users\adianidm\.cache\huggingface\datasets\csv\default-22230474c63e2a7d\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519)


  0%|          | 0/1 [00:00<?, ?it/s]

Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-aa12508fefee773d\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-8369730ef2a65754.arrow
Loading cached processed dataset at C:\Users\adianidm\.cache\huggingface\datasets\csv\default-22230474c63e2a7d\0.0.0\433e0ccc46f9880962cc2b12065189766fbb2bee57a221866138fb9203c83519\cache-2f7f6c95caa541ef.arrow
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
 

----------------------MODEL 1--------------------------------
Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.5331
200,0.4683
300,0.1956
400,0.1279




Training completed. Do not forget to share your model on huggingface.co/models =)


  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LA

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.70      0.82        10
          fa       1.00      1.00      1.00         9
          fe       0.82      0.90      0.86        10
          fp       0.93      0.88      0.90        16
          ft       0.90      1.00      0.95         9
           n       1.00      0.90      0.95        10
         n-d       0.00      0.00      0.00         2
       query       1.00      0.75      0.86         8
         sno       0.81      0.94      0.87        69
          so       0.33      0.12      0.18         8
           y       0.86      0.60      0.71        10
         y-d       0.20      1.00      0.33         1

    accuracy                           0.84       165
   macro avg       0.76      0.75      0.73       165
weighted avg       0.84      0.84      0.83       165

Combination:  {'batch_size': 32, 'lr': 3e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.4407
200,0.2792
300,0.0681
400,0.0405




Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e


              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.70      0.82        10
          fa       1.00      1.00      1.00         9
          fe       0.82      0.90      0.86        10
          fp       0.93      0.88      0.90        16
          ft       0.90      1.00      0.95         9
           n       1.00      0.70      0.82        10
         n-d       0.67      1.00      0.80         2
       query       1.00      0.62      0.77         8
         sno       0.80      0.94      0.87        69
          so       0.50      0.25      0.33         8
           y       0.86      0.60      0.71        10
         y-d       0.00      0.00      0.00         1

    accuracy                           0.84       165
   macro avg       0.81      0.74      0.76       165
weighted avg       0.85      0.84      0.83       165

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.8426
200,0.9892
300,0.4796
400,0.2556
500,0.1911
600,0.0939
700,0.0723
800,0.0406
900,0.0287
1000,0.0274


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       1.00      0.80      0.89        10
          fa       1.00      1.00      1.00         9
          fe       0.83      1.00      0.91        10
          fp       0.93      0.88      0.90        16
          ft       0.90      1.00      0.95         9
           n       0.88      0.70      0.78        10
         n-d       0.50      0.50      0.50         2
       query       0.83      0.62      0.71         8
         sno       0.83      0.93      0.88        69
          so       0.33      0.12      0.18         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.84       165
   macro avg       0.76      0.78      0.74       165
weighted avg       0.84      0.84      0.83       165

Combination:  {'batch_size': 8, 'lr': 5e-05, 'epochs': 40}


Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_2": 2,
    "LABEL_3": 3,
    "LABEL_4": 4,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
 

Step,Training Loss
100,1.4865
200,0.6284
300,0.2872
400,0.1325
500,0.1147
600,0.0483
700,0.0423
800,0.0278
900,0.0254
1000,0.0164


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.70      0.82        10
          fa       1.00      1.00      1.00         9
          fe       0.83      1.00      0.91        10
          fp       0.88      0.88      0.88        16
          ft       0.90      1.00      0.95         9
           n       0.88      0.70      0.78        10
         n-d       0.50      0.50      0.50         2
       query       1.00      0.75      0.86         8
         sno       0.83      0.94      0.88        69
          so       0.67      0.25      0.36         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.85       165
   macro avg       0.81      0.79      0.77       165
weighted avg       0.86      0.85      0.84       165

Combination:  {'batch_size': 32, 'lr': 2e-05, 'epochs': 40}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.4799
200,0.4256
300,0.1128
400,0.0531
500,0.0332
600,0.0261
700,0.0217
800,0.0235


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
 

              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       1.00      0.80      0.89        10
          fa       1.00      1.00      1.00         9
          fe       0.82      0.90      0.86        10
          fp       0.93      0.88      0.90        16
          ft       0.90      1.00      0.95         9
           n       0.89      0.80      0.84        10
         n-d       0.50      0.50      0.50         2
       query       1.00      0.62      0.77         8
         sno       0.82      0.94      0.88        69
          so       0.50      0.12      0.20         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.84       165
   macro avg       0.79      0.78      0.75       165
weighted avg       0.85      0.84      0.83       165

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.6737
200,0.738
300,0.3222
400,0.1425
500,0.0742
600,0.0492
700,0.0423
800,0.0316


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
 

              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       1.00      0.70      0.82        10
          fa       1.00      1.00      1.00         9
          fe       0.90      0.90      0.90        10
          fp       0.93      0.81      0.87        16
          ft       0.90      1.00      0.95         9
           n       0.89      0.80      0.84        10
         n-d       1.00      0.50      0.67         2
       query       1.00      0.75      0.86         8
         sno       0.80      0.96      0.87        69
          so       0.50      0.12      0.20         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.84       165
   macro avg       0.83      0.78      0.76       165
weighted avg       0.85      0.84      0.83       165

Combination:  {'batch_size': 8, 'lr': 2e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.8493
200,1.0185
300,0.5171
400,0.2799
500,0.2027
600,0.109
700,0.0943
800,0.055
900,0.0414
1000,0.0306


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1500
Configuration saved in Models/BERT_13classes\checkpoint-1500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1500\pytorch_

              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       1.00      0.80      0.89        10
          fa       1.00      1.00      1.00         9
          fe       0.82      0.90      0.86        10
          fp       0.88      0.88      0.88        16
          ft       1.00      1.00      1.00         9
           n       1.00      0.80      0.89        10
         n-d       0.67      1.00      0.80         2
       query       1.00      0.75      0.86         8
         sno       0.84      0.94      0.89        69
          so       0.33      0.12      0.18         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.85       165
   macro avg       0.80      0.83      0.78       165
weighted avg       0.86      0.85      0.85       165

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 20}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.0376
200,0.1157
300,0.0303
400,0.0206




Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0"

              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.90      0.95        10
          fa       1.00      1.00      1.00         9
          fe       0.83      1.00      0.91        10
          fp       0.93      0.81      0.87        16
          ft       0.90      1.00      0.95         9
           n       1.00      0.70      0.82        10
         n-d       0.67      1.00      0.80         2
       query       1.00      0.75      0.86         8
         sno       0.85      0.97      0.91        69
          so       1.00      0.25      0.40         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.87       165
   macro avg       0.87      0.84      0.81       165
weighted avg       0.90      0.87      0.87       165

Combination:  {'batch_size': 32, 'lr': 5e-05, 'epochs': 40}


loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from cache at C:\Users\adianidm/.cache\huggingface\transformers\a8041bf617d7f94ea26d15e218abd04afc2004805632abc0ed2066aa16d50d04.faf6ea826ae9c5867d12b22257f9877e6b8367890837bd60f7c54a29633f7f2f
Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertFo

Step,Training Loss
100,1.0313
200,0.1128
300,0.0231
400,0.0181
500,0.0149
600,0.0134
700,0.0116
800,0.013


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       1.00      1.00      1.00         3
         dno       1.00      0.80      0.89        10
          fa       1.00      1.00      1.00         9
          fe       0.82      0.90      0.86        10
          fp       0.93      0.88      0.90        16
          ft       0.90      1.00      0.95         9
           n       1.00      0.70      0.82        10
         n-d       0.67      1.00      0.80         2
       query       1.00      0.75      0.86         8
         sno       0.84      0.93      0.88        69
          so       0.50      0.38      0.43         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.85       165
   macro avg       0.83      0.84      0.81       165
weighted avg       0.87      0.85      0.85       165

Combination:  {'batch_size': 16, 'lr': 2e-05, 'epochs': 30}


loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at C:\Users\adianidm/.cache\huggingface\transformers\3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2",
    "3": "LABEL_3",
    "4": "LABEL_4",
    "5": "LABEL_5",
    "6": "LABEL_6",
    "7": "LABEL_7",
    "8": "LABEL_8",
    "9": "LABEL_9",
    "10": "LABEL_10",
    "11": "LABEL_11",
    "12": "LABEL_12"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
   

Step,Training Loss
100,1.6827
200,0.7376
300,0.2958
400,0.1223
500,0.0558
600,0.0341
700,0.0307
800,0.024
900,0.0218
1000,0.0227


Saving model checkpoint to Models/BERT_13classes\checkpoint-500
Configuration saved in Models/BERT_13classes\checkpoint-500\config.json
Model weights saved in Models/BERT_13classes\checkpoint-500\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-500\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-500\special_tokens_map.json
Saving model checkpoint to Models/BERT_13classes\checkpoint-1000
Configuration saved in Models/BERT_13classes\checkpoint-1000\config.json
Model weights saved in Models/BERT_13classes\checkpoint-1000\pytorch_model.bin
tokenizer config file saved in Models/BERT_13classes\checkpoint-1000\tokenizer_config.json
Special tokens file saved in Models/BERT_13classes\checkpoint-1000\special_tokens_map.json


Training completed. Do not forget to share your model on huggingface.co/models =)




              precision    recall  f1-score   support

         ack       0.75      1.00      0.86         3
         dno       1.00      0.80      0.89        10
          fa       1.00      1.00      1.00         9
          fe       0.83      1.00      0.91        10
          fp       0.88      0.88      0.88        16
          ft       1.00      1.00      1.00         9
           n       0.80      0.80      0.80        10
         n-d       1.00      0.50      0.67         2
       query       1.00      0.62      0.77         8
         sno       0.83      0.93      0.88        69
          so       0.33      0.12      0.18         8
           y       0.86      0.60      0.71        10
         y-d       0.25      1.00      0.40         1

    accuracy                           0.84       165
   macro avg       0.81      0.79      0.76       165
weighted avg       0.84      0.84      0.83       165



In [18]:
# Best model parameters-Comment out if using KFold
best params ={'epochs': 40, 
              'lr': 5e-5,
              'batch_size': 8}
            

In [None]:
#Comment out when not using KFold
#best_params = best_model['p']
#best_split = best_model['split']

## Train best estimator for classification report and confusion matrix

In [None]:
#Run kfold over here 
results = []
f1_scores=[]
best_model = []
i = 2 #Choose the split of data or just use train/test
train_dataset = load_dataset('csv', data_files={'train': 'Data/train.csv'})
#train_dataset = load_dataset('csv', data_files={'train': 'Data/train2.csv'})
testing_dataset =load_dataset("csv", data_files={'test':'Data/test.csv'}) 
#eval_dataset =load_dataset("csv", data_files={'test':'Data/eval.csv'}) 
#print(train_dataset["train"][0])

tokenized_dataset_train =train_dataset.map(preprocess_function)
#print(tokenized_dataset_train['train']['input_ids'])

tokenized_dataset_test = testing_dataset.map(preprocess_function)

data_collator = DataCollatorWithPadding(tokenizer=tokenizer)
#dataset has been loaded correctly. 
print("----------------------MODEL " + str(i)+"-------------------------------")


model=BertForSequenceClassification.from_pretrained(model_name, num_labels=13)
#device="cpu"
device="cuda"
model.to(device)


training_args = TrainingArguments(
num_train_epochs=best_params["epochs"],
learning_rate=best_params["lr"],
per_device_train_batch_size=best_params["batch_size"],  # batch size per device during training
weight_decay=0.01,               # strength of weight decay
#oad_best_model_at_end=True,
logging_steps=100,
#valuation_strategy="steps",
output_dir="Models/BERT_13classes_output"
)

trainer = Trainer( model=model,
              args=training_args,
              train_dataset=tokenized_dataset_train['train'],
              #eval_dataset=tokenized_dataset_valid['valid'],
              tokenizer=tokenizer,
              data_collator=data_collator
             )


trainer.train()

y_pred=[]

for text in tokenized_dataset_test["test"]["text"]:
    y_pred.append(get_prediction(text))

predictions = le.inverse_transform(y_pred)
y_true = tokenized_dataset_test['test']["label"]

acc = accuracy_score(le.inverse_transform(y_true), predictions)
#f1_score = f1_score(le.inverse_transform(y_true), predictions, average="macro")
#f1_scores.append(f1_score)
results.append(acc)
print(classification_report(le.inverse_transform(y_true), predictions))
f1= f1_score(le.inverse_transform(y_true), predictions, average="macro")
f1_scores.append(f1)
cm = confusion_matrix(le.inverse_transform(y_true), predictions)
disp = ConfusionMatrixDisplay(confusion_matrix=cm, display_labels=le.classes_)
disp.plot()

trainer.save_model("Models/{NAME_OF_OUTPUT_FOLDER_FOR_FINAL_MODEL}")