In [1]:
import os
from tqdm import tqdm
import numpy as np
from pathlib import Path
import argparse
import logging
import torch
from torch.utils.data import DataLoader
import wandb
from sklearn.metrics import mean_squared_error
import datasets
from transformers import (Trainer, TrainingArguments, DataCollatorWithPadding,
                          AutoTokenizer, AutoModelForSequenceClassification)

In [2]:
# Stop immediately if PyTorch cannot see a CUDA device.
assert torch.cuda.is_available(), 'GPU not found. You should fix this.'

In [3]:
# Authenticate this session with Weights & Biases before any sweep or run is created.
wandb.login()

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33mtiedaar1[0m ([33mai-aloe[0m). Use [1m`wandb login --relogin`[0m to force relogin


True

In [4]:
# Base directory (relative path) that the dataset and output paths below are built from.
DATA = '../../../data/spancat/'

In [5]:
# --- Model checkpoint and file locations (paths are built on top of DATA) ---
model_name_or_path = 'microsoft/deberta-v3-large'
dataset_path = f'{DATA}strategies-ds.hf'
output_dir = f'{DATA}spancat/results/hp-tuning'

# --- Tokenizer / Trainer settings ---
model_max_length = 2056
batch_size = 16               # used for both the train and eval per-device batch size
save_total_limit = 4
# In the visible notebook the next two are referenced only by commented-out
# TrainingArguments entries.
eval_steps = 1000
eval_accumulation_steps = 2

# --- Weights & Biases sweep settings ---
entity = 'ai-aloe'
project_name = 'metacognitive_classifier'
metric = 'f1'                 # optimised by the sweep as f'eval/{metric}'
sweep_id = None
dry_run = False               # when True the sweep is named 'dry-run'

In [6]:
import evaluate
import numpy as np

# Bundle the four classification metrics so one compute() call reports them all.
clf_metrics = evaluate.combine(["accuracy", "f1", "precision", "recall"])

def sigmoid(x):
   """Element-wise logistic function 1 / (1 + exp(-x)), computed without overflow.

   Args:
      x: A scalar or array-like of real numbers (e.g. raw logits).

   Returns:
      Values in [0, 1] with the same shape as ``x``; a NumPy scalar when ``x``
      is a scalar.
   """
   x = np.asarray(x)
   # exp(-|x|) lies in (0, 1] (or underflows to 0), so it can never overflow the
   # way exp(-x) does for large negative x.
   z = np.exp(-np.abs(x))
   # For x >= 0 this is exactly 1 / (1 + exp(-x)); for x < 0 the algebraically
   # equal form exp(x) / (1 + exp(x)) is used instead.
   out = np.where(x >= 0, 1 / (1 + z), z / (1 + z))
   # Indexing with () turns a 0-d result back into a scalar and leaves
   # n-d arrays untouched.
   return out[()]

def compute_metrics(eval_pred):
   """Score one evaluation pass with the combined classification metrics.

   The raw model outputs are passed through ``sigmoid`` and thresholded at 0.5.
   Predictions and labels are then flattened to 1-D integer arrays, so the
   metrics are computed over every individual (example, label) decision.

   Args:
      eval_pred: A pair that unpacks into (raw model outputs, reference labels).

   Returns:
      The result of ``clf_metrics.compute`` for the flattened arrays.
   """
   logits, gold = eval_pred
   # 1 where the sigmoid probability exceeds 0.5, else 0.
   hard_preds = (sigmoid(logits) > 0.5).astype(int)
   flat_preds = hard_preds.reshape(-1)
   flat_gold = gold.astype(int).reshape(-1)
   return clf_metrics.compute(predictions=flat_preds, references=flat_gold)

In [7]:
def load_dataset(dataset_path):
    """Load a dataset that was previously saved to disk.

    Args:
        dataset_path: Location handed to ``datasets.load_from_disk``.

    Returns:
        Whatever ``datasets.load_from_disk`` returns for that location.
    """
    return datasets.load_from_disk(dataset_path)

In [8]:
# Load from the configured `dataset_path` (same value as DATA+'strategies-ds.hf')
# so that changing the path in the config cell actually takes effect here.
ds = load_dataset(dataset_path)

In [9]:
def train():
    """Run one fine-tuning trial; this is the function handed to the W&B sweep agent.

    Starts a W&B run, reads the trial's hyperparameters (``learning_rate``,
    ``epochs``, ``weight_decay``, ``warmup_steps``) from ``wandb.config``, loads a
    fresh ``model_name_or_path`` checkpoint configured for 8-label multi-label
    classification, and trains it with the Hugging Face ``Trainer``.
    Evaluation, checkpointing and logging all happen once per epoch, and
    metrics are reported to W&B.

    Relies on notebook globals: ``model_name_or_path``, ``output_dir``,
    ``save_total_limit``, ``batch_size``, ``ds``, ``data_collator``,
    ``tokenizer`` and ``compute_metrics``.

    Returns:
        None.
    """
    wandb.init()
    hparams = wandb.config

    # A new model is loaded for every trial.
    classifier = AutoModelForSequenceClassification.from_pretrained(
        model_name_or_path,
        num_labels=8,
        problem_type="multi_label_classification",
    )

    # Evaluate, save and log on the same per-epoch cadence. The step-based
    # eval_steps / save_steps / eval_accumulation_steps options are not passed.
    cadence = 'epoch'
    arg_values = dict(
        # NOTE(review): every trial writes its checkpoints to this same directory.
        output_dir=output_dir,
        evaluation_strategy=cadence,
        save_strategy=cadence,
        logging_strategy=cadence,
        save_total_limit=save_total_limit,
        optim='adamw_torch',
        # Values chosen by the sweep for this trial.
        learning_rate=hparams.learning_rate,
        num_train_epochs=hparams.epochs,
        weight_decay=hparams.weight_decay,
        warmup_steps=hparams.warmup_steps,
        # Fixed notebook-level settings.
        per_device_train_batch_size=batch_size,
        per_device_eval_batch_size=batch_size,
        disable_tqdm=False,
        report_to='wandb',
    )
    run_args = TrainingArguments(**arg_values)

    Trainer(
        model=classifier,
        args=run_args,
        train_dataset=ds['train'],
        eval_dataset=ds['test'],
        data_collator=data_collator,
        compute_metrics=compute_metrics,
        tokenizer=tokenizer,
    ).train()

In [10]:
# The tokenizer's length cap is set through `model_max_length`. The previously
# used `max_length` keyword is a per-call argument, not a tokenizer init option,
# so the configured limit was never applied to the tokenizer.
tokenizer = AutoTokenizer.from_pretrained(
    model_name_or_path,
    model_max_length=model_max_length,
)



In [11]:
# Collator that pads batches with the tokenizer (to a multiple of 16) and
# returns PyTorch tensors.
data_collator = DataCollatorWithPadding(
    tokenizer=tokenizer,
    pad_to_multiple_of=16,
    return_tensors='pt',
)

# A new sweep is always created below: `sweep_id` is assigned unconditionally,
# so any value set earlier for it is overwritten.
sweep_goal = 'maximize'
sweep_name = 'dry-run' if dry_run else f'{model_name_or_path}'

# Hyperparameters explored by the sweep. `train()` reads each of them from
# wandb.config. (No 'dropout' entry is part of the search space.)
search_space = {
    'epochs': {'values': list(range(1, 11))},
    'learning_rate': {
        'distribution': 'uniform',
        'min': 5e-6,
        'max': 1e-5,
    },
    'weight_decay': {'values': [0.01]},
    'warmup_steps': {'values': [50, 100, 500, 1000]},
}

sweep_config = {
    'name': sweep_name,
    'method': 'bayes',
    'metric': {
        'name': f'eval/{metric}',
        'goal': sweep_goal,
    },
    'parameters': search_space,
}

# Register the sweep, then have the agent call train() with count=30.
sweep_id = wandb.sweep(sweep_config, entity=entity, project=project_name)
wandb.agent(sweep_id, train, count=30)

Create sweep with ID: 8ellv5tx
Sweep URL: https://wandb.ai/ai-aloe/metacognitive_classifier/sweeps/8ellv5tx


[34m[1mwandb[0m: Agent Starting Run: jmnm51f5 with config:
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 8.484830074719205e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.7296,0.711866,0.518955,0.142466,0.099744,0.249201
2,0.5561,0.382462,0.872951,0.51938,0.660099,0.428115
3,0.3639,0.331549,0.88166,0.492308,0.788732,0.357827
4,0.3226,0.302206,0.89498,0.5629,0.846154,0.421725
5,0.2936,0.279921,0.901639,0.591489,0.88535,0.444089
6,0.2586,0.25621,0.910348,0.665392,0.828571,0.555911
7,0.2235,0.225138,0.92418,0.734767,0.836735,0.654952


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▇▇▇███
eval/f1,▁▅▅▆▆▇█
eval/loss,█▃▃▂▂▁▁
eval/precision,▁▆▇██▇█
eval/recall,▁▄▃▄▄▆█
eval/runtime,▁▅▄▃▅▆█
eval/samples_per_second,█▄▅▆▄▃▁
eval/steps_per_second,█▄▅▆▄▃▁
train/epoch,▁▁▂▂▃▃▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▅▅▆▆▇▇███

0,1
eval/accuracy,0.92418
eval/f1,0.73477
eval/loss,0.22514
eval/precision,0.83673
eval/recall,0.65495
eval/runtime,2.7837
eval/samples_per_second,87.652
eval/steps_per_second,5.748
total_flos,2421223110623232.0
train/epoch,7.0


[34m[1mwandb[0m: Agent Starting Run: 1ns8lrpb with config:
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5.8843975438419745e-06
[34m[1mwandb[0m: 	warmup_steps: 100
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.633,0.516587,0.844775,0.09009,0.75,0.047923
2,0.4002,0.345871,0.876537,0.492632,0.722222,0.373802
3,0.3276,0.303212,0.895492,0.542601,0.909774,0.386581
4,0.2885,0.27483,0.908811,0.62605,0.91411,0.476038
5,0.26,0.26224,0.905225,0.615385,0.880952,0.472843
6,0.2389,0.248109,0.915984,0.679688,0.874372,0.555911
7,0.2255,0.246807,0.915984,0.683398,0.863415,0.565495


VBox(children=(Label(value='0.008 MB of 0.016 MB uploaded\r'), FloatProgress(value=0.4786386676321506, max=1.0…

0,1
eval/accuracy,▁▄▆▇▇██
eval/f1,▁▆▆▇▇██
eval/loss,█▄▂▂▁▁▁
eval/precision,▂▁██▇▇▆
eval/recall,▁▅▆▇▇██
eval/runtime,▁▄██▇▅▇
eval/samples_per_second,█▅▁▁▂▄▂
eval/steps_per_second,█▅▁▁▂▄▂
train/epoch,▁▁▂▂▃▃▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▅▅▆▆▇▇███

0,1
eval/accuracy,0.91598
eval/f1,0.6834
eval/loss,0.24681
eval/precision,0.86341
eval/recall,0.5655
eval/runtime,2.7708
eval/samples_per_second,88.063
eval/steps_per_second,5.775
total_flos,2421223110623232.0
train/epoch,7.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: po4dh1mn with config:
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 8.354398112150327e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6591,0.652402,0.65625,0.341511,0.246459,0.555911
2,0.636,0.575325,0.85502,0.383442,0.60274,0.28115
3,0.4961,0.396498,0.861168,0.320802,0.744186,0.204473
4,0.3776,0.349461,0.871414,0.518234,0.649038,0.43131
5,0.3447,0.321933,0.885246,0.523404,0.783439,0.392971
6,0.3157,0.313111,0.890369,0.561475,0.782857,0.4377
7,0.2904,0.288757,0.901639,0.649635,0.757447,0.56869


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▇▇▇███
eval/f1,▁▂▁▅▅▆█
eval/loss,█▇▃▂▂▁▁
eval/precision,▁▆▇▆███
eval/recall,█▂▁▅▅▅█
eval/runtime,▁▃▅▇▁█▄
eval/samples_per_second,█▆▄▂█▁▅
eval/steps_per_second,▇▆▄▃█▁▅
train/epoch,▁▁▂▂▃▃▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▅▅▆▆▇▇███

0,1
eval/accuracy,0.90164
eval/f1,0.64964
eval/loss,0.28876
eval/precision,0.75745
eval/recall,0.56869
eval/runtime,2.7755
eval/samples_per_second,87.912
eval/steps_per_second,5.765
total_flos,2421223110623232.0
train/epoch,7.0


[34m[1mwandb[0m: Agent Starting Run: ri1wjx9u with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 5.644455160928555e-06
[34m[1mwandb[0m: 	warmup_steps: 50
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5917,0.3945,0.871414,0.492929,0.67033,0.389776
2,0.361,0.332918,0.880635,0.485651,0.785714,0.351438
3,0.3154,0.294608,0.89498,0.54343,0.897059,0.389776
4,0.2813,0.268635,0.904201,0.589011,0.943662,0.428115
5,0.2553,0.260587,0.907787,0.637097,0.863388,0.504792
6,0.2325,0.247704,0.913422,0.694394,0.8,0.613419
7,0.2146,0.235275,0.920082,0.715328,0.834043,0.626198
8,0.2031,0.228048,0.922643,0.719852,0.858407,0.619808
9,0.1961,0.227506,0.921619,0.720293,0.84188,0.629393


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▂▄▅▆▇███
eval/f1,▁▁▃▄▆▇███
eval/loss,█▅▄▃▂▂▁▁▁
eval/precision,▁▄▇█▆▄▅▆▅
eval/recall,▂▁▂▃▅████
eval/runtime,▁▁▄▅▃▂▂█▃
eval/samples_per_second,██▅▄▆▇▇▁▆
eval/steps_per_second,██▅▄▆▇▇▁▆
train/epoch,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███

0,1
eval/accuracy,0.92162
eval/f1,0.72029
eval/loss,0.22751
eval/precision,0.84188
eval/recall,0.62939
eval/runtime,2.7755
eval/samples_per_second,87.913
eval/steps_per_second,5.765
total_flos,3104813238276096.0
train/epoch,9.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: dea0icu6 with config:
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 5.362834488047011e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6492,0.643563,0.726947,0.043088,0.04918,0.038339
2,0.6387,0.624475,0.728484,0.043321,0.049793,0.038339
3,0.58,0.477495,0.839139,0.0,0.0,0.0
4,0.4174,0.362416,0.868852,0.509579,0.636364,0.42492
5,0.3591,0.339867,0.877561,0.511247,0.710227,0.399361


VBox(children=(Label(value='0.008 MB of 0.026 MB uploaded\r'), FloatProgress(value=0.28716742081447966, max=1.…

0,1
eval/accuracy,▁▁▆██
eval/f1,▂▂▁██
eval/loss,██▄▂▁
eval/precision,▁▁▁▇█
eval/recall,▂▂▁██
eval/runtime,▁▇▆█▇
eval/samples_per_second,█▂▃▁▂
eval/steps_per_second,█▂▃▁▂
train/epoch,▁▁▃▃▅▅▆▆███
train/global_step,▁▁▃▃▅▅▆▆███

0,1
eval/accuracy,0.87756
eval/f1,0.51125
eval/loss,0.33987
eval/precision,0.71023
eval/recall,0.39936
eval/runtime,2.7767
eval/samples_per_second,87.875
eval/steps_per_second,5.762
total_flos,1737574735686144.0
train/epoch,5.0


[34m[1mwandb[0m: Agent Starting Run: f323tvy9 with config:
[34m[1mwandb[0m: 	epochs: 8
[34m[1mwandb[0m: 	learning_rate: 8.29837661672417e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6673,0.652067,0.622439,0.075282,0.061983,0.095847
2,0.5555,0.39404,0.874488,0.505051,0.686813,0.399361
3,0.3704,0.339378,0.880635,0.49676,0.766667,0.367412
4,0.3316,0.317041,0.88832,0.488263,0.920354,0.332268
5,0.2997,0.2915,0.900615,0.583691,0.888889,0.434505
6,0.268,0.259799,0.907275,0.623701,0.892857,0.479233
7,0.2296,0.230224,0.923668,0.728597,0.847458,0.638978
8,0.1947,0.205776,0.929303,0.737643,0.910798,0.619808


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▇▇▇▇▇██
eval/f1,▁▆▅▅▆▇██
eval/loss,█▄▃▃▂▂▁▁
eval/precision,▁▆▇███▇█
eval/recall,▁▅▅▄▅▆██
eval/runtime,▁█▅▄▅▄▃▄
eval/samples_per_second,█▁▄▅▄▅▆▅
eval/steps_per_second,█▁▅▅▄▅▆▅
train/epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▆▆▇▇███

0,1
eval/accuracy,0.9293
eval/f1,0.73764
eval/loss,0.20578
eval/precision,0.9108
eval/recall,0.61981
eval/runtime,2.7731
eval/samples_per_second,87.989
eval/steps_per_second,5.77
total_flos,2764882087544832.0
train/epoch,8.0


[34m[1mwandb[0m: Agent Starting Run: pmmg0ky3 with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 8.769156724059092e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6473,0.606745,0.802766,0.455446,0.408629,0.514377
2,0.5255,0.413413,0.856045,0.495512,0.565574,0.440895
3,0.3742,0.334779,0.88166,0.507463,0.762821,0.380192
4,0.3271,0.31118,0.891906,0.508159,0.939655,0.348243
5,0.2933,0.28639,0.901639,0.582609,0.911565,0.428115
6,0.2656,0.270338,0.91291,0.658635,0.886486,0.523962
7,0.2363,0.25407,0.915984,0.696296,0.828194,0.600639
8,0.2129,0.224474,0.924693,0.716763,0.902913,0.594249
9,0.1779,0.213148,0.928279,0.746377,0.861925,0.658147


VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▄▅▆▇▇▇██
eval/f1,▁▂▂▂▄▆▇▇█
eval/loss,█▅▃▃▂▂▂▁▁
eval/precision,▁▃▆██▇▇█▇
eval/recall,▅▃▂▁▃▅▇▇█
eval/runtime,▁▅▅▄▆█▅▄▄
eval/samples_per_second,█▄▄▅▃▁▄▅▅
eval/steps_per_second,█▄▄▄▃▁▄▄▅
train/epoch,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███

0,1
eval/accuracy,0.92828
eval/f1,0.74638
eval/loss,0.21315
eval/precision,0.86192
eval/recall,0.65815
eval/runtime,2.77
eval/samples_per_second,88.088
eval/steps_per_second,5.776
total_flos,3104813238276096.0
train/epoch,9.0


[34m[1mwandb[0m: Agent Starting Run: n24i4tyi with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 8.775835474193544e-06
[34m[1mwandb[0m: 	warmup_steps: 100
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6017,0.423137,0.86834,0.506718,0.634615,0.421725
2,0.3624,0.330135,0.882172,0.465116,0.854701,0.319489
3,0.3069,0.300151,0.89293,0.576065,0.788889,0.453674
4,0.2734,0.273684,0.900102,0.584222,0.878205,0.4377
5,0.242,0.250643,0.914447,0.670611,0.876289,0.543131
6,0.2183,0.244185,0.913422,0.675624,0.846154,0.5623
7,0.2,0.239216,0.913934,0.694545,0.805907,0.610224
8,0.1856,0.225085,0.923156,0.723247,0.855895,0.626198
9,0.176,0.226587,0.923156,0.726277,0.846809,0.635783


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▃▄▅▇▇▇██
eval/f1,▂▁▄▄▇▇▇██
eval/loss,█▅▄▃▂▂▁▁▁
eval/precision,▁▇▅██▇▆▇▇
eval/recall,▃▁▄▄▆▆▇██
eval/runtime,▁▇▅▄▄▅▄▄█
eval/samples_per_second,█▂▄▅▅▄▅▅▁
eval/steps_per_second,█▂▄▅▅▄▅▅▁
train/epoch,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███

0,1
eval/accuracy,0.92316
eval/f1,0.72628
eval/loss,0.22659
eval/precision,0.84681
eval/recall,0.63578
eval/runtime,2.786
eval/samples_per_second,87.582
eval/steps_per_second,5.743
total_flos,3104813238276096.0
train/epoch,9.0


[34m[1mwandb[0m: Agent Starting Run: 5gkztf3c with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 9.809754664356172e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6449,0.628419,0.726947,0.043088,0.04918,0.038339
2,0.5428,0.391648,0.873463,0.514735,0.668367,0.41853
3,0.3648,0.336325,0.877561,0.488223,0.74026,0.364217
4,0.3205,0.298889,0.895492,0.546667,0.89781,0.392971
5,0.2808,0.277832,0.904713,0.600858,0.915033,0.447284
6,0.247,0.258068,0.913422,0.676864,0.842857,0.565495
7,0.2183,0.238489,0.918033,0.708029,0.825532,0.619808
8,0.183,0.205925,0.925717,0.733945,0.862069,0.638978


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: cmta4fs4 with config:
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	learning_rate: 9.946303722432942e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6448,0.628113,0.726947,0.043088,0.04918,0.038339
2,0.5412,0.390291,0.872439,0.516505,0.658416,0.42492
3,0.3643,0.336299,0.877561,0.490405,0.737179,0.367412
4,0.32,0.297989,0.897541,0.55157,0.924812,0.392971
5,0.2795,0.277218,0.904713,0.600858,0.915033,0.447284
6,0.2448,0.255414,0.915984,0.697417,0.825328,0.603834
7,0.2169,0.235942,0.915984,0.705036,0.806584,0.626198
8,0.1809,0.201734,0.928279,0.735849,0.898618,0.623003
9,0.142,0.184074,0.941086,0.80737,0.848592,0.769968
10,0.112,0.163717,0.94877,0.830508,0.884477,0.782748


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▆▆▆▇▇▇▇██
eval/f1,▁▅▅▆▆▇▇▇██
eval/loss,█▄▄▃▃▂▂▂▁▁
eval/precision,▁▆▇██▇▇█▇█
eval/recall,▁▅▄▄▅▆▇▆██
eval/runtime,▆▃▁▂█▂▁▅▁▃
eval/samples_per_second,▃▆█▇▁▇█▄█▆
eval/steps_per_second,▃▆▇▆▁▇█▄█▆
train/epoch,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███
train/global_step,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███

0,1
eval/accuracy,0.94877
eval/f1,0.83051
eval/loss,0.16372
eval/precision,0.88448
eval/recall,0.78275
eval/runtime,2.7824
eval/samples_per_second,87.696
eval/steps_per_second,5.751
total_flos,3444860883575808.0
train/epoch,10.0


[34m[1mwandb[0m: Agent Starting Run: stjqabbv with config:
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	learning_rate: 9.917868095538506e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6724,0.655856,0.726947,0.043088,0.04918,0.038339
2,0.5855,0.421109,0.842725,0.055385,0.75,0.028754
3,0.3768,0.34526,0.873463,0.452328,0.73913,0.325879
4,0.3312,0.302165,0.89498,0.541387,0.902985,0.386581
5,0.2905,0.273927,0.907275,0.610753,0.934211,0.453674
6,0.2519,0.247193,0.91752,0.690979,0.865385,0.57508
7,0.2161,0.223997,0.924693,0.741652,0.824219,0.674121
8,0.1793,0.205555,0.930328,0.742424,0.911628,0.626198
9,0.1476,0.203826,0.93084,0.776119,0.806897,0.747604
10,0.1241,0.178989,0.940574,0.797909,0.877395,0.731629


VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▅▆▇▇▇▇███
eval/f1,▁▁▅▆▆▇▇▇██
eval/loss,█▅▃▃▂▂▂▁▁▁
eval/precision,▁▇▆██▇▇█▇█
eval/recall,▁▁▄▄▅▆▇▇██
eval/runtime,▂█▅▂▅▄▂▁▃▂
eval/samples_per_second,▇▁▄▇▄▅▇█▆▇
eval/steps_per_second,▇▁▄▇▄▅▇█▆▇
train/epoch,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███
train/global_step,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███

0,1
eval/accuracy,0.94057
eval/f1,0.79791
eval/loss,0.17899
eval/precision,0.87739
eval/recall,0.73163
eval/runtime,2.7762
eval/samples_per_second,87.89
eval/steps_per_second,5.763
total_flos,3444860883575808.0
train/epoch,10.0


[34m[1mwandb[0m: Agent Starting Run: 9fii11kt with config:
[34m[1mwandb[0m: 	epochs: 4
[34m[1mwandb[0m: 	learning_rate: 9.68925232668124e-06
[34m[1mwandb[0m: 	warmup_steps: 50
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5784,0.361353,0.869365,0.500978,0.646465,0.408946
2,0.3378,0.305602,0.894467,0.52968,0.928,0.370607
3,0.3017,0.303195,0.89498,0.526559,0.95,0.364217
4,0.2761,0.28277,0.902664,0.585153,0.924138,0.428115


VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▆▆█
eval/f1,▁▃▃█
eval/loss,█▃▃▁
eval/precision,▁▇█▇
eval/recall,▆▂▁█
eval/runtime,▁▇█▂
eval/samples_per_second,█▂▁▇
eval/steps_per_second,█▂▁▇
train/epoch,▁▁▃▃▆▆███
train/global_step,▁▁▃▃▆▆███

0,1
eval/accuracy,0.90266
eval/f1,0.58515
eval/loss,0.28277
eval/precision,0.92414
eval/recall,0.42812
eval/runtime,2.771
eval/samples_per_second,88.056
eval/steps_per_second,5.774
total_flos,1388207524910592.0
train/epoch,4.0


[34m[1mwandb[0m: Agent Starting Run: dqdqfofl with config:
[34m[1mwandb[0m: 	epochs: 1
[34m[1mwandb[0m: 	learning_rate: 5.5397322025704185e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.703,0.693776,0.52459,0.29052,0.190955,0.607029


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁
eval/f1,▁
eval/loss,▁
eval/precision,▁
eval/recall,▁
eval/runtime,▁
eval/samples_per_second,▁
eval/steps_per_second,▁
train/epoch,▁▁▁
train/global_step,▁▁▁

0,1
eval/accuracy,0.52459
eval/f1,0.29052
eval/loss,0.69378
eval/precision,0.19095
eval/recall,0.60703
eval/runtime,2.7753
eval/samples_per_second,87.919
eval/steps_per_second,5.765
total_flos,350939887449600.0
train/epoch,1.0


[34m[1mwandb[0m: Agent Starting Run: 1yh39cxx with config:
[34m[1mwandb[0m: 	epochs: 7
[34m[1mwandb[0m: 	learning_rate: 5.898116615385523e-06
[34m[1mwandb[0m: 	warmup_steps: 50
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6486,0.382349,0.870902,0.509728,0.651741,0.41853
2,0.3466,0.311268,0.887807,0.498856,0.879032,0.348243
3,0.3038,0.291544,0.89959,0.556561,0.953488,0.392971
4,0.272,0.271735,0.906762,0.625514,0.878613,0.485623
5,0.2496,0.254062,0.911373,0.640333,0.916667,0.492013
6,0.2304,0.243721,0.915984,0.673307,0.89418,0.539936
7,0.2203,0.243468,0.91752,0.687379,0.876238,0.565495


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▄▅▆▇██
eval/f1,▁▁▃▆▆▇█
eval/loss,█▄▃▂▂▁▁
eval/precision,▁▆█▆▇▇▆
eval/recall,▃▁▂▅▆▇█
eval/runtime,▁▁▅▄▅▅█
eval/samples_per_second,██▄▅▄▄▁
eval/steps_per_second,██▅▅▄▄▁
train/epoch,▁▁▂▂▃▃▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▅▅▆▆▇▇███

0,1
eval/accuracy,0.91752
eval/f1,0.68738
eval/loss,0.24347
eval/precision,0.87624
eval/recall,0.5655
eval/runtime,2.7838
eval/samples_per_second,87.651
eval/steps_per_second,5.748
total_flos,2421223110623232.0
train/epoch,7.0


[34m[1mwandb[0m: Agent Starting Run: juvbjo01 with config:
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	learning_rate: 6.956512493102417e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6573,0.646566,0.662398,0.344279,0.25,0.552716
2,0.5955,0.481894,0.846311,0.096386,0.842105,0.051118
3,0.412,0.357612,0.871414,0.453159,0.712329,0.332268
4,0.348,0.324943,0.880123,0.502128,0.751592,0.376997
5,0.3176,0.295389,0.896004,0.557734,0.876712,0.408946
6,0.2813,0.284476,0.903689,0.658182,0.763713,0.578275
7,0.2425,0.238947,0.918033,0.715302,0.807229,0.642173
8,0.2071,0.21855,0.927254,0.738971,0.87013,0.642173
9,0.1784,0.236607,0.913422,0.73132,0.727848,0.734824
10,0.1553,0.196458,0.935451,0.77972,0.861004,0.71246


VBox(children=(Label(value='0.027 MB of 0.027 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▆▆▇▇▇██▇█
eval/f1,▄▁▅▅▆▇▇███
eval/loss,█▅▄▃▃▂▂▁▂▁
eval/precision,▁█▆▇█▇▇█▆█
eval/recall,▆▁▄▄▅▆▇▇██
eval/runtime,▃▄▄▂▂▄▂█▂▁
eval/samples_per_second,▆▅▅▇▇▅▇▁▇█
eval/steps_per_second,▆▅▅▇▇▅▇▁▇█
train/epoch,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███
train/global_step,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███

0,1
eval/accuracy,0.93545
eval/f1,0.77972
eval/loss,0.19646
eval/precision,0.861
eval/recall,0.71246
eval/runtime,2.7687
eval/samples_per_second,88.127
eval/steps_per_second,5.779
total_flos,3444860883575808.0
train/epoch,10.0


[34m[1mwandb[0m: Agent Starting Run: zx9ym5y8 with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 5.9183055813707145e-06
[34m[1mwandb[0m: 	warmup_steps: 100
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6541,0.554067,0.839139,0.0,0.0,0.0
2,0.4181,0.347334,0.872951,0.441441,0.748092,0.313099
3,0.3257,0.301203,0.89498,0.553377,0.869863,0.405751
4,0.294,0.286551,0.896516,0.538813,0.944,0.376997
5,0.2628,0.259642,0.903176,0.584615,0.93662,0.42492
6,0.2366,0.248184,0.914959,0.670635,0.884817,0.539936
7,0.2189,0.240262,0.921107,0.709434,0.866359,0.600639
8,0.2061,0.231796,0.923668,0.72045,0.872727,0.613419
9,0.1974,0.229978,0.924693,0.725234,0.873874,0.619808


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▄▆▆▆▇███
eval/f1,▁▅▆▆▇▇███
eval/loss,█▄▃▂▂▁▁▁▁
eval/precision,▁▇▇███▇▇▇
eval/recall,▁▅▆▅▆▇███
eval/runtime,▁█▅▅▄▄▅▅▂
eval/samples_per_second,█▁▄▄▅▅▄▄▇
eval/steps_per_second,█▁▄▄▅▅▄▄▇
train/epoch,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███

0,1
eval/accuracy,0.92469
eval/f1,0.72523
eval/loss,0.22998
eval/precision,0.87387
eval/recall,0.61981
eval/runtime,2.7657
eval/samples_per_second,88.222
eval/steps_per_second,5.785
total_flos,3104813238276096.0
train/epoch,9.0


[34m[1mwandb[0m: Agent Starting Run: mme497yw with config:
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 8.037016383176912e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.646,0.632627,0.726947,0.043088,0.04918,0.038339
2,0.5722,0.435233,0.861168,0.299742,0.783784,0.185304
3,0.3821,0.343814,0.876537,0.488323,0.727848,0.367412
4,0.3287,0.304704,0.89293,0.538631,0.871429,0.389776
5,0.2909,0.283351,0.901639,0.591489,0.88535,0.444089


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▆▇██
eval/f1,▁▄▇▇█
eval/loss,█▄▂▁▁
eval/precision,▁▇▇██
eval/recall,▁▄▇▇█
eval/runtime,▄▆▅▁█
eval/samples_per_second,▅▃▄█▁
eval/steps_per_second,▅▄▅█▁
train/epoch,▁▁▃▃▅▅▆▆███
train/global_step,▁▁▃▃▅▅▆▆███

0,1
eval/accuracy,0.90164
eval/f1,0.59149
eval/loss,0.28335
eval/precision,0.88535
eval/recall,0.44409
eval/runtime,2.7874
eval/samples_per_second,87.536
eval/steps_per_second,5.74
total_flos,1737574735686144.0
train/epoch,5.0


[34m[1mwandb[0m: Agent Starting Run: sxyo09pw with config:
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 8.02383033686227e-06
[34m[1mwandb[0m: 	warmup_steps: 100
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.616,0.410101,0.870389,0.512524,0.645631,0.42492
2,0.3596,0.322151,0.883709,0.515991,0.775641,0.386581
3,0.3129,0.303012,0.895492,0.550661,0.886525,0.399361


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▅█
eval/f1,▁▂█
eval/loss,█▂▁
eval/precision,▁▅█
eval/recall,█▁▃
eval/runtime,▄▁█
eval/samples_per_second,▅█▁
eval/steps_per_second,▅█▁
train/epoch,▁▁▅▅███
train/global_step,▁▁▅▅███

0,1
eval/accuracy,0.89549
eval/f1,0.55066
eval/loss,0.30301
eval/precision,0.88652
eval/recall,0.39936
eval/runtime,2.7741
eval/samples_per_second,87.957
eval/steps_per_second,5.768
total_flos,1046849315715840.0
train/epoch,3.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ooihww4q with config:
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 6.025434790489964e-06
[34m[1mwandb[0m: 	warmup_steps: 50
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5456,0.362388,0.869877,0.507752,0.64532,0.41853
2,0.3479,0.327492,0.883709,0.522105,0.765432,0.396166
3,0.314,0.301947,0.89498,0.547461,0.885714,0.396166
4,0.2862,0.28906,0.901639,0.586207,0.900662,0.434505
5,0.2707,0.285154,0.901127,0.581345,0.905405,0.428115


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▄▇██
eval/f1,▁▂▅██
eval/loss,█▅▃▁▁
eval/precision,▁▄▇██
eval/recall,▅▁▁█▇
eval/runtime,▁▅▂█▄
eval/samples_per_second,█▄▇▁▅
eval/steps_per_second,█▅▇▁▅
train/epoch,▁▁▃▃▅▅▆▆███
train/global_step,▁▁▃▃▅▅▆▆███

0,1
eval/accuracy,0.90113
eval/f1,0.58134
eval/loss,0.28515
eval/precision,0.90541
eval/recall,0.42812
eval/runtime,2.7724
eval/samples_per_second,88.011
eval/steps_per_second,5.771
total_flos,1737574735686144.0
train/epoch,5.0


[34m[1mwandb[0m: Agent Starting Run: uh3amdxu with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 7.986301123571913e-06
[34m[1mwandb[0m: 	warmup_steps: 100
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6164,0.410839,0.872951,0.515625,0.663317,0.421725
2,0.3598,0.320977,0.885758,0.512035,0.8125,0.373802
3,0.3057,0.289577,0.899078,0.561247,0.926471,0.402556
4,0.2632,0.260395,0.906762,0.614407,0.91195,0.463259
5,0.2249,0.240441,0.920594,0.704762,0.872642,0.591054
6,0.2018,0.231387,0.918545,0.720562,0.800781,0.654952
7,0.181,0.214021,0.928279,0.751773,0.844622,0.677316
8,0.1655,0.201543,0.931352,0.755474,0.880851,0.661342
9,0.1568,0.20066,0.93084,0.754991,0.87395,0.664537


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▃▄▅▇▆███
eval/f1,▁▁▂▄▇▇███
eval/loss,█▅▄▃▂▂▁▁▁
eval/precision,▁▅██▇▅▆▇▇
eval/recall,▂▁▂▃▆▇███
eval/runtime,▁▄█▅▄█▇▂▃
eval/samples_per_second,█▅▁▄▅▁▂▇▆
eval/steps_per_second,█▅▁▄▅▁▂▇▆
train/epoch,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███

0,1
eval/accuracy,0.93084
eval/f1,0.75499
eval/loss,0.20066
eval/precision,0.87395
eval/recall,0.66454
eval/runtime,2.7698
eval/samples_per_second,88.092
eval/steps_per_second,5.777
total_flos,3104813238276096.0
train/epoch,9.0


[34m[1mwandb[0m: Agent Starting Run: wm3w8nyr with config:
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5.167044915740036e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6493,0.64375,0.726947,0.043088,0.04918,0.038339
2,0.6392,0.625775,0.727971,0.043243,0.049587,0.038339
3,0.586,0.488127,0.839652,0.0,0.0,0.0


  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▁█
eval/f1,██▁
eval/loss,█▇▁
eval/precision,██▁
eval/recall,██▁
eval/runtime,█▁▁
eval/samples_per_second,▁██
eval/steps_per_second,▁██
train/epoch,▁▁▅▅███
train/global_step,▁▁▅▅███

0,1
eval/accuracy,0.83965
eval/f1,0.0
eval/loss,0.48813
eval/precision,0.0
eval/recall,0.0
eval/runtime,2.7752
eval/samples_per_second,87.922
eval/steps_per_second,5.765
total_flos,1046849315715840.0
train/epoch,3.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 4dralhbj with config:
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 6.462772644232436e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6373,0.614061,0.85502,0.491921,0.561475,0.4377
2,0.5353,0.408613,0.859119,0.499089,0.580508,0.4377
3,0.3821,0.346853,0.878074,0.504167,0.724551,0.386581
4,0.3393,0.323683,0.882684,0.4662,0.862069,0.319489
5,0.3087,0.309609,0.889857,0.549266,0.79878,0.41853


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▂▆▇█
eval/f1,▃▄▄▁█
eval/loss,█▃▂▁▁
eval/precision,▁▁▅█▇
eval/recall,██▅▁▇
eval/runtime,▁█▇▆▆
eval/samples_per_second,█▁▂▃▃
eval/steps_per_second,█▁▂▃▃
train/epoch,▁▁▃▃▅▅▆▆███
train/global_step,▁▁▃▃▅▅▆▆███

0,1
eval/accuracy,0.88986
eval/f1,0.54927
eval/loss,0.30961
eval/precision,0.79878
eval/recall,0.41853
eval/runtime,2.7696
eval/samples_per_second,88.098
eval/steps_per_second,5.777
total_flos,1737574735686144.0
train/epoch,5.0


[34m[1mwandb[0m: Agent Starting Run: fzb79a4e with config:
[34m[1mwandb[0m: 	epochs: 3
[34m[1mwandb[0m: 	learning_rate: 5.467769403244844e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6712,0.664985,0.619877,0.074813,0.06135,0.095847
2,0.6582,0.641441,0.635758,0.075423,0.063596,0.092652
3,0.5558,0.424981,0.876025,0.480687,0.732026,0.357827


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▁█
eval/f1,▁▁█
eval/loss,█▇▁
eval/precision,▁▁█
eval/recall,▁▁█
eval/runtime,▁▄█
eval/samples_per_second,█▅▁
eval/steps_per_second,█▅▁
train/epoch,▁▁▅▅███
train/global_step,▁▁▅▅███

0,1
eval/accuracy,0.87602
eval/f1,0.48069
eval/loss,0.42498
eval/precision,0.73203
eval/recall,0.35783
eval/runtime,2.7788
eval/samples_per_second,87.809
eval/steps_per_second,5.758
total_flos,1046849315715840.0
train/epoch,3.0


[34m[1mwandb[0m: Agent Starting Run: mbp8dacj with config:
[34m[1mwandb[0m: 	epochs: 1
[34m[1mwandb[0m: 	learning_rate: 6.733189579445929e-06
[34m[1mwandb[0m: 	warmup_steps: 500
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6369,0.612422,0.85502,0.491921,0.561475,0.4377


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁
eval/f1,▁
eval/loss,▁
eval/precision,▁
eval/recall,▁
eval/runtime,▁
eval/samples_per_second,▁
eval/steps_per_second,▁
train/epoch,▁▁▁
train/global_step,▁▁▁

0,1
eval/accuracy,0.85502
eval/f1,0.49192
eval/loss,0.61242
eval/precision,0.56148
eval/recall,0.4377
eval/runtime,2.7644
eval/samples_per_second,88.267
eval/steps_per_second,5.788
total_flos,350939887449600.0
train/epoch,1.0


[34m[1mwandb[0m: Agent Starting Run: hyibz6b0 with config:
[34m[1mwandb[0m: 	epochs: 8
[34m[1mwandb[0m: 	learning_rate: 9.829080036348189e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.7266,0.720645,0.336578,0.298863,0.179922,0.881789
2,0.7061,0.679733,0.679816,0.371859,0.271261,0.591054
3,0.4755,0.362569,0.876025,0.464602,0.755396,0.335463
4,0.349,0.322822,0.885246,0.513043,0.802721,0.376997
5,0.3148,0.294308,0.89498,0.557235,0.86,0.412141
6,0.2867,0.274785,0.908811,0.641129,0.868852,0.507987
7,0.2567,0.261019,0.913934,0.695652,0.803347,0.613419
8,0.2293,0.238346,0.919057,0.709559,0.835498,0.616613


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▅▇█████
eval/f1,▁▂▄▅▅▇██
eval/loss,█▇▃▂▂▂▁▁
eval/precision,▁▂▇▇██▇█
eval/recall,█▄▁▂▂▃▅▅
eval/runtime,▂▃▁▅█▃▂▁
eval/samples_per_second,▇▆█▄▁▆██
eval/steps_per_second,▇▆█▄▁▆██
train/epoch,▁▁▂▂▃▃▄▄▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▆▆▇▇███

0,1
eval/accuracy,0.91906
eval/f1,0.70956
eval/loss,0.23835
eval/precision,0.8355
eval/recall,0.61661
eval/runtime,2.7711
eval/samples_per_second,88.053
eval/steps_per_second,5.774
total_flos,2764882087544832.0
train/epoch,8.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: s17r3zik with config:
[34m[1mwandb[0m: 	epochs: 9
[34m[1mwandb[0m: 	learning_rate: 5.442631041052797e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6564,0.649651,0.651639,0.360902,0.255659,0.613419
2,0.6255,0.571607,0.850922,0.488576,0.542969,0.444089
3,0.5353,0.464605,0.856045,0.495512,0.565574,0.440895
4,0.4216,0.362645,0.871926,0.513619,0.656716,0.421725
5,0.3604,0.335715,0.884734,0.520256,0.782051,0.389776
6,0.3314,0.313266,0.894467,0.561702,0.840764,0.421725
7,0.307,0.303139,0.893955,0.56785,0.819277,0.434505
8,0.2846,0.283537,0.90625,0.611465,0.911392,0.460064
9,0.2677,0.296679,0.896516,0.648084,0.712644,0.594249


VBox(children=(Label(value='0.008 MB of 0.026 MB uploaded\r'), FloatProgress(value=0.2871724337628493, max=1.0…

0,1
eval/accuracy,▁▆▇▇▇████
eval/f1,▁▄▄▅▅▆▆▇█
eval/loss,█▇▄▃▂▂▁▁▁
eval/precision,▁▄▄▅▇▇▇█▆
eval/recall,█▃▃▂▁▂▂▃▇
eval/runtime,▁▃██▅▅▇▄▅
eval/samples_per_second,█▆▁▁▄▄▂▅▄
eval/steps_per_second,█▆▁▁▄▄▂▅▄
train/epoch,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███
train/global_step,▁▁▂▂▃▃▄▄▅▅▅▅▆▆▇▇███

0,1
eval/accuracy,0.89652
eval/f1,0.64808
eval/loss,0.29668
eval/precision,0.71264
eval/recall,0.59425
eval/runtime,2.7755
eval/samples_per_second,87.914
eval/steps_per_second,5.765
total_flos,3104813238276096.0
train/epoch,9.0


[34m[1mwandb[0m: Agent Starting Run: esi54qh8 with config:
[34m[1mwandb[0m: 	epochs: 5
[34m[1mwandb[0m: 	learning_rate: 9.794509462485289e-06
[34m[1mwandb[0m: 	warmup_steps: 50
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5421,0.34864,0.873463,0.498986,0.683333,0.392971
2,0.329,0.30231,0.898053,0.558758,0.913043,0.402556
3,0.2896,0.282084,0.904201,0.619145,0.853933,0.485623
4,0.2531,0.263777,0.90625,0.613108,0.90625,0.463259
5,0.2319,0.256196,0.909324,0.65896,0.830097,0.546326


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▆▇▇█
eval/f1,▁▄▆▆█
eval/loss,█▄▃▂▁
eval/precision,▁█▆█▅
eval/recall,▁▁▅▄█
eval/runtime,▄▅█▁▇
eval/samples_per_second,▅▄▁█▂
eval/steps_per_second,▅▄▁█▂
train/epoch,▁▁▃▃▅▅▆▆███
train/global_step,▁▁▃▃▅▅▆▆███

0,1
eval/accuracy,0.90932
eval/f1,0.65896
eval/loss,0.2562
eval/precision,0.8301
eval/recall,0.54633
eval/runtime,2.7821
eval/samples_per_second,87.702
eval/steps_per_second,5.751
total_flos,1737574735686144.0
train/epoch,5.0


[34m[1mwandb[0m: Agent Starting Run: uirmmo0s with config:
[34m[1mwandb[0m: 	epochs: 1
[34m[1mwandb[0m: 	learning_rate: 7.425516935504392e-06
[34m[1mwandb[0m: 	warmup_steps: 50
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.5668,0.365972,0.869365,0.50677,0.642157,0.41853


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁
eval/f1,▁
eval/loss,▁
eval/precision,▁
eval/recall,▁
eval/runtime,▁
eval/samples_per_second,▁
eval/steps_per_second,▁
train/epoch,▁▁▁
train/global_step,▁▁▁

0,1
eval/accuracy,0.86936
eval/f1,0.50677
eval/loss,0.36597
eval/precision,0.64216
eval/recall,0.41853
eval/runtime,2.761
eval/samples_per_second,88.373
eval/steps_per_second,5.795
total_flos,350939887449600.0
train/epoch,1.0


[34m[1mwandb[0m: Agent Starting Run: sn8wc0y6 with config:
[34m[1mwandb[0m: 	epochs: 10
[34m[1mwandb[0m: 	learning_rate: 5.183910896250867e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.7284,0.726005,0.296619,0.291903,0.174047,0.904153
2,0.7174,0.709451,0.540984,0.352601,0.227824,0.779553
3,0.6703,0.525888,0.835553,0.0,0.0,0.0
4,0.429,0.360857,0.869365,0.508671,0.640777,0.421725
5,0.353,0.327095,0.883709,0.511828,0.782895,0.380192
6,0.3216,0.301329,0.896004,0.551876,0.892857,0.399361
7,0.2991,0.290008,0.902152,0.604555,0.858824,0.466454
8,0.275,0.270594,0.908811,0.622881,0.924528,0.469649
9,0.2543,0.261885,0.913422,0.691042,0.807692,0.603834
10,0.2333,0.246236,0.916496,0.697588,0.831858,0.600639


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁▄▇▇██████
eval/f1,▄▅▁▆▆▇▇▇██
eval/loss,██▅▃▂▂▂▁▁▁
eval/precision,▂▃▁▆▇███▇▇
eval/recall,█▇▁▄▄▄▅▅▆▆
eval/runtime,▁▅█▅▃▄▄▄▄▃
eval/samples_per_second,█▄▁▄▆▅▅▅▄▆
eval/steps_per_second,█▄▁▄▆▅▅▅▄▆
train/epoch,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███
train/global_step,▁▁▂▂▃▃▃▃▄▄▅▅▆▆▆▆▇▇███

0,1
eval/accuracy,0.9165
eval/f1,0.69759
eval/loss,0.24624
eval/precision,0.83186
eval/recall,0.60064
eval/runtime,2.768
eval/samples_per_second,88.15
eval/steps_per_second,5.78
total_flos,3444860883575808.0
train/epoch,10.0


[34m[1mwandb[0m: Agent Starting Run: eci9saaa with config:
[34m[1mwandb[0m: 	epochs: 2
[34m[1mwandb[0m: 	learning_rate: 5.067048219163398e-06
[34m[1mwandb[0m: 	warmup_steps: 1000
[34m[1mwandb[0m: 	weight_decay: 0.01
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-large and are newly initialized: ['classifier.bias', 'classifier.weight', 'pooler.dense.bias', 'pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.6777,0.671511,0.693135,0.159888,0.1425,0.182109
2,0.6669,0.655243,0.726947,0.043088,0.04918,0.038339


VBox(children=(Label(value='0.008 MB of 0.008 MB uploaded\r'), FloatProgress(value=1.0, max=1.0)))

0,1
eval/accuracy,▁█
eval/f1,█▁
eval/loss,█▁
eval/precision,█▁
eval/recall,█▁
eval/runtime,▁█
eval/samples_per_second,█▁
eval/steps_per_second,█▁
train/epoch,▁▁███
train/global_step,▁▁███

0,1
eval/accuracy,0.72695
eval/f1,0.04309
eval/loss,0.65524
eval/precision,0.04918
eval/recall,0.03834
eval/runtime,2.7821
eval/samples_per_second,87.704
eval/steps_per_second,5.751
total_flos,697860712287744.0
train/epoch,2.0
