In [1]:
import torch
import transformers
import torch.nn as nn
from torch.utils.data import DataLoader
from tqdm.notebook import tqdm

from transformers import Trainer, TrainingArguments
from transformers import BertTokenizer
from transformers import BertPreTrainedModel, BertModel, DistilBertPreTrainedModel, DistilBertModel, DistilBertConfig
from transformers import RobertaTokenizer

import pandas as pd
import numpy as np
import os
import csv

from sklearn.metrics import classification_report

# just checking somethingdf
from datasets import Dataset

# my custom function
import utils
import importlib
from sklearn.model_selection import train_test_split

# import the libraries from bert
from bert import BERT_PCL, PCLDataset, Trainer_PCL, DistillBert_PCL, RobertaPCL
import bert

if not torch.cuda.is_available():
  print('WARNING: You may want to change the runtime to GPU for faster training!')
  DEVICE = 'cpu'
else:
  DEVICE = 'cuda:0'

import os
import pickle
from itertools import product
content = os.path.abspath('/vol/bitbucket/ahf119/')

In [2]:
importlib.reload(bert)

<module 'bert' from '/homes/ahf119/Desktop/nlp_cw/bert.py'>

In [3]:
EPOCHS = 7

In [4]:
def write_dict_to_csv(file_path, data_dict):
    # Extract fieldnames from the first dictionary key
    fieldnames = list(data_dict.keys())

    # Check if the file already exists or not
    file_exists = True
    try:
        with open(file_path, 'r') as file:
            reader = csv.DictReader(file)
            if not reader.fieldnames:
                file_exists = False
    except FileNotFoundError:
        file_exists = False

    # Write data to CSV
    with open(file_path, 'a', newline='') as file:
        writer = csv.DictWriter(file, fieldnames=fieldnames)

        # Write header if the file is empty
        if not file_exists:
            writer.writeheader()

        # Write data
        writer.writerow(data_dict)

In [5]:
params = {
    'lr': [0.00001, 0.00005],
    # 'warmup_ratio': [0.1, 0.2],
    'learning_schedule': ['linear', 'constant'],
    'augmentation': {
        'augment0': {
            'inserted': False,
            'subbed': False,
            'back_translated': False,
            'deleted': False,
            'swapped': False
        },
        'augment1': {        
            'inserted': True,
            'subbed': False,
            'back_translated': False,
            'deleted': False,
            'swapped': False
            },
            'augment2': {
                'inserted': False,
                'subbed': True,
                'back_translated': False,
                'deleted': False,
                'swapped': False
            },
            'augment3': {
                'inserted': False,
                'subbed': False,
                'back_translated': True,
                'deleted': False,
                'swapped': False
            },
            'augment4': {
                'inserted': False,
                'subbed': False,
                'back_translated': False,
                'deleted': True,
                'swapped': False
            },
            'augment5': {
                'inserted': False,
                'subbed': False,
                'back_translated': False,
                'deleted': False,
                'swapped': True
            }
        }
    }

# Generate all possible combinations of parameters
param_grid = list(product(*params.values()))
print(len(param_grid))

24


In [6]:
def train_once(lr, learning_schedule, augment_dict, best_f1):
    model_output=f'{content}/wandtest_model'
    model_type = 'bert-base-cased'
    
    if model_type.startswith('bert'):
        model = BERT_PCL.from_pretrained(model_type)
    elif model_type.startswith('distil'):
        model = DistillBert_PCL.from_pretrained(model_type)
    elif model_type.startswith('roberta'):
        model = RobertaPCL.from_pretrained(model_type)
    
    args = TrainingArguments(
        output_dir=f'{content}/wandtest',
        learning_rate=lr,
        logging_steps=10,
        remove_unused_columns=False,
        per_device_train_batch_size=32,
        per_device_eval_batch_size=32,
        num_train_epochs=EPOCHS,
        seed=42,
        evaluation_strategy='steps',
        eval_steps=100,
        save_strategy='steps',
        save_steps=100,
        load_best_model_at_end=True,
        metric_for_best_model='f1',
        greater_is_better=True,
        lr_scheduler_type=learning_schedule,
        warmup_ratio=0.1,
    )

    train_dataset, val_dataset, test_dataset = bert.all_augmentations(model_type, inserted = augment_dict['inserted'], subbed = augment_dict['subbed'], back_translated = augment_dict['back_translated'], 
                                                                      deleted = augment_dict['deleted'], swapped = augment_dict['swapped'])

    trainer = bert.main_PCL_v1(model=model, args=args, train_dataset=train_dataset, val_dataset=val_dataset, model_output=model_output)
    if model_type.startswith('bert'):
        model = BERT_PCL.from_pretrained(model_output)
    elif model_type.startswith('distil'):
        model = DistillBert_PCL.from_pretrained(model_output)
    elif model_type.startswith('roberta'):
        model = RobertaPCL.from_pretrained(model_output)
    metrics = bert.evaluate(model, DataLoader(val_dataset))
    f1 = metrics['PCL']['f1-score']

    if f1 > best_f1:
        best_f1 = f1
        trainer.save_model(f'{content}/best_model')
        with open('saved_metrics.pkl', 'wb') as f:
            pickle.dump(metrics, f)

    model_data = metrics['PCL'].copy()
    model_data['learning_rate'] = lr
    model_data['learning_schedule'] = learning_schedule
    model_data['inserted'] = augment_dict['inserted']
    model_data['deleted'] = augment_dict['deleted']
    model_data['subbed'] = augment_dict['subbed']
    model_data['back_translated'] = augment_dict['back_translated']
    model_data['swapped'] = augment_dict['swapped']

    write_dict_to_csv(file_path = 'hyperparam_res_{}.csv'.format(model_type), data_dict = model_data)
    
    return best_f1
    

In [7]:
best_f1 = -1

current_parameter = 0
for i, param_set in enumerate(param_grid):
    if i < current_parameter:
        continue
    best_f1 = train_once(param_set[0], param_set[1], params['augmentation'][param_set[2]], best_f1)
    print(f'Finished param set with index: {i}')

Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped False


[34m[1mwandb[0m: Currently logged in as: [33manders-frelin19[0m ([33mhugo-frelin[0m). Use [1m`wandb login --relogin`[0m to force relogin


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3913,0.452175,0.897732,0.0,0.0,0.0
200,0.3396,0.380004,0.903303,0.554688,0.276265,0.368831
300,0.3598,0.410615,0.906088,0.62963,0.198444,0.301775
400,0.3188,0.318992,0.902507,0.523256,0.525292,0.524272
500,0.2045,0.389605,0.916832,0.653846,0.396887,0.493947
600,0.2625,0.383187,0.90967,0.566372,0.498054,0.530021
700,0.1744,0.395918,0.912455,0.59204,0.463035,0.519651
800,0.1707,0.384158,0.912455,0.58296,0.505837,0.541667
900,0.0909,0.470213,0.913649,0.603093,0.455253,0.518847
1000,0.1032,0.46696,0.911659,0.578475,0.501946,0.5375


  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 0


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted True
subbed False
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.5072,0.427849,0.890569,0.235294,0.031128,0.054983
200,0.3956,0.34764,0.901313,0.526627,0.346304,0.41784
300,0.2752,0.330351,0.897732,0.5,0.55642,0.526703
400,0.29,0.332517,0.912455,0.610778,0.396887,0.481132
500,0.1694,0.35163,0.898528,0.503546,0.552529,0.526902
600,0.1297,0.386845,0.909272,0.568075,0.470817,0.514894
700,0.1713,0.567069,0.909272,0.623932,0.284047,0.390374
800,0.1484,0.51923,0.912455,0.620915,0.36965,0.463415


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 1


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed True
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4885,0.446671,0.886988,0.373832,0.155642,0.21978
200,0.4123,0.354166,0.898926,0.511278,0.264591,0.348718
300,0.3082,0.326873,0.905292,0.540084,0.498054,0.518219
400,0.2939,0.301634,0.910068,0.567686,0.505837,0.534979
500,0.2144,0.332144,0.913251,0.592417,0.486381,0.534188
600,0.1754,0.320942,0.90768,0.549801,0.536965,0.543307
700,0.1393,0.412458,0.913649,0.60101,0.463035,0.523077
800,0.1723,0.441372,0.911659,0.571429,0.544747,0.557769
900,0.13,0.514354,0.920812,0.679012,0.428016,0.52506
1000,0.0442,0.598027,0.917628,0.701613,0.338521,0.456693


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 2


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated True
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4425,0.437105,0.879427,0.290909,0.124514,0.174387
200,0.3208,0.357494,0.904099,0.567797,0.2607,0.357333
300,0.2227,0.360805,0.903701,0.541899,0.377432,0.444954
400,0.2696,0.319748,0.887784,0.460568,0.568093,0.508711
500,0.1381,0.438471,0.900915,0.521978,0.36965,0.432802
600,0.1572,0.398241,0.902109,0.527363,0.412451,0.462882
700,0.1097,0.557332,0.912057,0.657895,0.291829,0.404313


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 3


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted True
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.533,0.43261,0.89813,0.6,0.011673,0.022901
200,0.4367,0.343437,0.890171,0.458874,0.412451,0.434426
300,0.2982,0.342843,0.910864,0.598802,0.389105,0.471698
400,0.3022,0.333512,0.914843,0.616216,0.44358,0.515837
500,0.2271,0.408409,0.911659,0.633588,0.322957,0.427835
600,0.1193,0.41749,0.911659,0.61745,0.357977,0.453202
700,0.1486,0.521845,0.912455,0.624161,0.361868,0.458128


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 4


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped True


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.5043,0.428044,0.895344,0.392857,0.042802,0.077193
200,0.4174,0.347771,0.90569,0.590909,0.252918,0.354223
300,0.2829,0.338104,0.912057,0.645161,0.311284,0.419948
400,0.2896,0.333583,0.911261,0.60625,0.377432,0.465228
500,0.2148,0.406702,0.912455,0.620915,0.36965,0.463415
600,0.1039,0.394725,0.90967,0.58427,0.404669,0.478161
700,0.1594,0.539195,0.914445,0.661538,0.33463,0.444444
800,0.13,0.505593,0.915639,0.627119,0.431907,0.511521
900,0.0981,0.584233,0.914047,0.699029,0.280156,0.4
1000,0.0264,0.692544,0.915241,0.711538,0.287938,0.409972


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

IOPub message rate exceeded.
The Jupyter server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--ServerApp.iopub_msg_rate_limit`.

Current values:
ServerApp.iopub_msg_rate_limit=1000.0 (msgs/sec)
ServerApp.rate_limit_window=3.0 (secs)

  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty.

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 6


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted True
subbed False
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4389,0.375124,0.896936,0.482759,0.108949,0.177778
200,0.3712,0.326474,0.906088,0.55615,0.404669,0.468468
300,0.2361,0.321337,0.901313,0.515358,0.587549,0.549091
400,0.2593,0.304711,0.907282,0.547619,0.536965,0.54224
500,0.1326,0.340335,0.899721,0.508306,0.595331,0.548387
600,0.1245,0.387266,0.902507,0.52521,0.486381,0.505051


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.


  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 7


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed True
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4176,0.389649,0.89813,0.504505,0.217899,0.304348
200,0.352,0.335474,0.910068,0.597484,0.36965,0.456731
300,0.2809,0.341291,0.893752,0.483333,0.564202,0.520646
400,0.2725,0.332117,0.90967,0.579787,0.424125,0.489888
500,0.1492,0.397622,0.886988,0.458462,0.579767,0.512027
600,0.1429,0.375623,0.902507,0.527027,0.455253,0.488518


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.


  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 8


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated True
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3193,0.396221,0.897334,0.496599,0.284047,0.361386
200,0.3142,0.358855,0.906486,0.583333,0.299611,0.395887
300,0.2161,0.361081,0.898528,0.504425,0.44358,0.47205
400,0.2319,0.333986,0.910466,0.594118,0.392996,0.473068
500,0.1222,0.502434,0.908078,0.691176,0.182879,0.289231
600,0.1472,0.404116,0.89614,0.492248,0.494163,0.493204
700,0.0647,0.650515,0.910466,0.677778,0.237354,0.351585
800,0.0657,0.554961,0.915639,0.771084,0.249027,0.376471
900,0.0267,0.591651,0.916435,0.644172,0.40856,0.5
1000,0.0455,0.700581,0.912853,0.706522,0.252918,0.372493


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 9


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted True
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4168,0.383633,0.901313,0.540541,0.233463,0.326087
200,0.3811,0.324414,0.902507,0.527273,0.451362,0.486373
300,0.2522,0.325451,0.906486,0.551402,0.459144,0.501062
400,0.2464,0.317727,0.914843,0.60804,0.470817,0.530702
500,0.1587,0.370211,0.89614,0.492857,0.536965,0.513966
600,0.1204,0.457912,0.914445,0.645833,0.361868,0.46384
700,0.1474,0.617611,0.914047,0.684685,0.29572,0.413043


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 10


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped True


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.405,0.358808,0.900119,0.529412,0.210117,0.300836
200,0.3531,0.313798,0.910466,0.583333,0.435798,0.498886
300,0.2223,0.336664,0.908874,0.568627,0.451362,0.503254
400,0.2471,0.324442,0.90768,0.557078,0.474708,0.512605
500,0.1287,0.38852,0.90768,0.55102,0.525292,0.537849
600,0.0972,0.438518,0.913251,0.602094,0.447471,0.513393
700,0.1486,0.552303,0.911261,0.594444,0.416342,0.489703
800,0.1,0.542628,0.912057,0.579646,0.509728,0.542443
900,0.066,0.706193,0.920812,0.674699,0.435798,0.529551
1000,0.0222,0.921992,0.917628,0.784091,0.268482,0.4


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 11


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3366,0.393738,0.90569,0.763158,0.11284,0.19661
200,0.335,0.314871,0.906088,0.559322,0.385214,0.456221
300,0.2549,0.357992,0.906088,0.558011,0.392996,0.461187
400,0.1638,0.462734,0.905292,0.544601,0.451362,0.493617
500,0.0769,0.51927,0.905292,0.543379,0.463035,0.5
600,0.1462,0.578329,0.916435,0.691057,0.330739,0.447368
700,0.0466,0.600526,0.902905,0.524904,0.533074,0.528958
800,0.0006,0.761098,0.904895,0.5375,0.501946,0.519115
900,0.0013,0.812805,0.915241,0.629412,0.416342,0.501171
1000,0.0004,0.873077,0.913251,0.616766,0.400778,0.485849


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 12


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted True
subbed False
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4594,0.424278,0.899721,1.0,0.019455,0.038168
200,0.3344,0.327341,0.908874,0.573684,0.424125,0.487696
300,0.2405,0.371572,0.912455,0.619355,0.373541,0.466019
400,0.2701,0.299201,0.890967,0.474164,0.607004,0.532423
500,0.1322,0.435505,0.881417,0.446194,0.661479,0.532915
600,0.0322,0.429575,0.897334,0.498054,0.498054,0.498054
700,0.0833,0.653009,0.90967,0.588235,0.389105,0.468384
800,0.0261,0.634579,0.912853,0.595,0.463035,0.520788


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 13


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed True
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4089,0.446972,0.898528,1.0,0.007782,0.015444
200,0.3502,0.331253,0.907282,0.575949,0.354086,0.438554
300,0.2052,0.398616,0.910068,0.6,0.361868,0.451456
400,0.242,0.3159,0.892559,0.480826,0.634241,0.54698
500,0.1032,0.417115,0.893752,0.483221,0.560311,0.518919
600,0.0794,0.443858,0.88659,0.45858,0.603113,0.521008
700,0.1921,0.676481,0.913251,0.624204,0.381323,0.47343


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 14


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated True
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.2937,0.464372,0.901711,0.647059,0.085603,0.151203
200,0.2806,0.397937,0.901711,0.527778,0.36965,0.434783
300,0.1742,0.447437,0.906884,0.592,0.287938,0.387435
400,0.1888,0.33232,0.910068,0.582011,0.428016,0.493274
500,0.0706,0.574023,0.892161,0.473282,0.48249,0.477842
600,0.0243,0.703947,0.901711,0.532895,0.315175,0.396088
700,0.0439,0.91432,0.911659,0.769231,0.194553,0.310559


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 15


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted True
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4799,0.39219,0.902905,0.76,0.07393,0.134752
200,0.4661,0.415472,0.81337,0.326797,0.77821,0.460299
300,0.2261,0.404924,0.886988,0.458967,0.587549,0.515358
400,0.1986,0.414408,0.904895,0.534351,0.544747,0.539499
500,0.1316,0.428796,0.902507,0.525,0.490272,0.507042
600,0.0396,0.598494,0.902507,0.525641,0.478599,0.501018
700,0.0649,0.783715,0.910864,0.627907,0.315175,0.419689


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 16


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped True


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3944,0.34599,0.88659,0.453333,0.529183,0.48833
200,0.381,0.362794,0.825706,0.343696,0.774319,0.476077
300,0.2271,0.350858,0.900915,0.517241,0.466926,0.490798
400,0.2657,0.336412,0.894946,0.488599,0.583658,0.531915
500,0.1072,0.385698,0.891365,0.476048,0.618677,0.538071
600,0.1145,0.445377,0.91723,0.671329,0.373541,0.48
700,0.0835,0.667668,0.914047,0.612022,0.435798,0.509091
800,0.0688,0.650151,0.918026,0.666667,0.396887,0.497561


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 17


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.24,0.383785,0.89813,0.502392,0.40856,0.450644
200,0.2756,0.351272,0.908078,0.568421,0.420233,0.483221
300,0.2348,0.458219,0.904099,0.653846,0.132296,0.220065
400,0.2727,0.368733,0.881417,0.44058,0.59144,0.504983
500,0.1815,0.589018,0.901313,0.524064,0.381323,0.441441
600,0.1432,0.611166,0.904099,0.54,0.420233,0.472648
700,0.1464,0.613906,0.906884,0.552511,0.470817,0.508403
800,0.0454,0.674882,0.906088,0.554974,0.412451,0.473214
900,0.0135,1.002568,0.910466,0.617647,0.326848,0.427481
1000,0.0002,1.0629,0.910864,0.613793,0.346304,0.442786


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 18


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted True
subbed False
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3709,0.339601,0.910864,0.708861,0.217899,0.333333
200,0.3859,0.369829,0.897732,0.5,0.023346,0.04461
300,0.227,0.342463,0.903701,0.535211,0.44358,0.485106
400,0.213,0.309198,0.902905,0.521886,0.603113,0.559567
500,0.0976,0.393405,0.88659,0.461326,0.649805,0.53958
600,0.0551,0.479376,0.903701,0.533937,0.459144,0.493724
700,0.0712,0.745364,0.914445,0.677966,0.311284,0.426667


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 19


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed True
back_translated False
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.4508,0.42061,0.896936,0.375,0.011673,0.022642
200,0.3674,0.342538,0.913649,0.613636,0.420233,0.498845
300,0.2089,0.349494,0.871866,0.419355,0.657588,0.512121
400,0.2729,0.360638,0.90967,0.582418,0.412451,0.482916
500,0.1024,0.473617,0.906884,0.553488,0.463035,0.504237
600,0.0791,0.555158,0.876641,0.415335,0.505837,0.45614


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.


  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 20


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated True
deleted False
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3157,0.377218,0.896936,0.492308,0.249027,0.330749
200,0.2772,0.350064,0.898528,0.50463,0.424125,0.460888
300,0.1551,0.517569,0.906884,0.595041,0.280156,0.380952
400,0.1704,0.469832,0.911261,0.625,0.330739,0.43257
500,0.1518,0.780353,0.881815,0.42126,0.416342,0.418787


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.


  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 21


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted True
swapped False


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.397,0.350792,0.901711,0.647059,0.085603,0.151203
200,0.4161,0.440858,0.787903,0.302292,0.821012,0.441885
300,0.1395,0.400424,0.911261,0.590426,0.431907,0.498876
400,0.1906,0.491225,0.914047,0.651852,0.342412,0.44898
500,0.1522,0.565083,0.914843,0.693694,0.299611,0.418478
600,0.0482,0.617061,0.908874,0.570707,0.439689,0.496703


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.


  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 22


Some weights of BERT_PCL were not initialized from the model checkpoint at bert-base-cased and are newly initialized: ['classification.1.bias', 'classification.1.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


inserted False
subbed False
back_translated False
deleted False
swapped True


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.3991,0.347497,0.909272,0.635514,0.264591,0.373626
200,0.3596,0.390731,0.789097,0.298969,0.789883,0.433761
300,0.1783,0.311135,0.89415,0.484642,0.552529,0.516364
400,0.1715,0.395407,0.907282,0.5625,0.420233,0.481069
500,0.1202,0.432937,0.900915,0.515504,0.51751,0.516505
600,0.1072,0.49684,0.879029,0.427692,0.540856,0.477663
700,0.0527,0.800219,0.911261,0.634921,0.311284,0.417755
800,0.0473,0.707041,0.912853,0.620253,0.381323,0.472289


Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-100 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-200 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-300 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-400 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-500 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Checkpoint destination directory /vol/bitbucket/ahf119/wandtest/checkpoint-600 already exists and is non-empty. Saving will proceed but saved results may be invalid.
Chec

  0%|          | 0/2513 [00:00<?, ?it/s]

Finished param set with index: 23
