In [1]:
import pandas as pd
import numpy as np
import torch

torch.cuda.empty_cache()

def read_file(fname: str, correct_labels=True) -> pd.DataFrame:
    """Reads a filename, return df with text and labels."""

    df = pd.read_table(fname, sep="\t", header=None, names="text,labels,role".split(","))
    if correct_labels:
        offensive_ids = df.labels != "Acceptable speech"
        df.labels[offensive_ids] = 1
        df.labels[~offensive_ids] = 0

    df = df.drop(columns=["role"])
    return df


def run_hyperparams_optimization(model_name, model_type, lang):
    import torch
    torch.cuda.empty_cache()
    if lang not in {"sl", "hr", "en"}:
        raise AttributeError(f"Language {lang} is not valid")
    eval_file, train_file = f"../data/merged-{lang}.test.tsv" , f"../data/merged-{lang}.train.tsv"
    from simpletransformers.classification import ClassificationModel, ClassificationArgs
    import wandb


    model_args = ClassificationArgs()
    model_args.use_early_stopping = True
    model_args.early_stopping_delta = 0.01
    model_args.early_stopping_metric = "mcc"
    model_args.early_stopping_metric_minimize = False
    model_args.early_stopping_patience = 3
    model_args.evaluate_during_training_steps = 1000

    model_args.evaluate_during_training = True
    model_args.manual_seed = 4
    model_args.use_multiprocessing = True
    model_args.eval_batch_size = 8
    model_args.labels_list = [0, 1]
    model_args.wandb_project = "task3"
    model_args.reprocess_input_data = True
    model_args.overwrite_output_dir = True
    model_args.no_save = True

    sweep_config = {
        "method": "bayes",  # grid, random
        "metric": {"name": "mcc", "goal": "maximize"},
        "parameters": {
            "num_train_epochs":  {"max": 20, "min": 3},
            "learning_rate": {"min": 1e-6, "max": 1e-4},
            "train_batch_size": {"max": 100, "min": 5}
        },
    }

    sweep_id = wandb.sweep(sweep_config, project="task3_"+model_name.replace("/", "_")+model_type)

    train_df = read_file(train_file, correct_labels=True)
    eval_df = read_file(eval_file, correct_labels=True)

    def train():
        # Initialize a new wandb run
        wandb.init()

        # Create a TransformerModel
        model = ClassificationModel(
            model_type,
            model_name,
            use_cuda=True,
            args=model_args,
            sweep_config=wandb.config,
        )
        model.overwrite_output_dir = True
        model.no_save = True
        
        
        # Train the model
        model.train_model(train_df, eval_df=eval_df)

        # Evaluate the model
        model.eval_model(eval_df)

        # Sync wandb
        wandb.join()

    wandb.agent(sweep_id, train, count=50)


 "electra",
        "classla/bcms-bertic",

In [2]:
model_name = "classla/bcms-bertic"
model_type = "electra"
language = "hr"

run_hyperparams_optimization(model_name, model_type, language)

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Create sweep with ID: 6am13hot
Sweep URL: https://wandb.ai/5roop/task3_classla_bcms-berticelectra/sweeps/6am13hot


[34m[1mwandb[0m: Agent Starting Run: 4g9eu69v with config:
[34m[1mwandb[0m: 	learning_rate: 3.435642841771529e-05
[34m[1mwandb[0m: 	num_train_epochs: 14
[34m[1mwandb[0m: 	train_batch_size: 17
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33m5roop[0m (use `wandb login --relogin` to force relogin)


Some weights of the model checkpoint at classla/bcms-bertic were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight', 'discriminator_predictions.dense_prediction.bias']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at classla/bcms-bertic and are newly initialized: ['pooler.dense.bias', 'pooler.dense.weight

HBox(children=(FloatProgress(value=0.0, max=8851.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=14.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 14', max=521.0, style=ProgressStyle(de…

  torch.nn.utils.clip_grad_norm_(





HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 14', max=521.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 14', max=521.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 14', max=521.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 14', max=521.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2120.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 14', max=521.0, style=ProgressStyle(de…

[34m[1mwandb[0m: Ctrl + C detected. Stopping sweep.


In [3]:
model_name = "EMBEDDIA/sloberta"
model_type = "camembert"
language = "sl"

run_hyperparams_optimization(model_name, model_type, language)

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


KeyboardInterrupt: 

In [7]:
model_name = "EMBEDDIA/sloberta"
model_type = "roberta"
language = "sl"

run_hyperparams_optimization(model_name, model_type, language)

Create sweep with ID: um04mk5v
Sweep URL: https://wandb.ai/5roop/task3_EMBEDDIA_slobertaroberta/sweeps/um04mk5v


[34m[1mwandb[0m: Agent Starting Run: qwu4qq1k with config:
[34m[1mwandb[0m: 	learning_rate: 1.5175992821295014e-05
[34m[1mwandb[0m: 	num_train_epochs: 7
[34m[1mwandb[0m: 	train_batch_size: 13
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


You are using a model of type camembert to instantiate a model of type roberta. This is not supported for all configurations of models and can yield errors.
Some weights of the model checkpoint at EMBEDDIA/sloberta were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.bias', 'lm_head.dense.weight', 'lm_head.decoder.bias', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.layer_norm.weight', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification we

VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run qwu4qq1k errored: OSError("Can't load tokenizer for 'EMBEDDIA/sloberta'. Make sure that:\n\n- 'EMBEDDIA/sloberta' is a correct model identifier listed on 'https://huggingface.co/models'\n\n- or 'EMBEDDIA/sloberta' is the correct path to a directory containing relevant tokenizer files\n\n")
[34m[1mwandb[0m: [32m[41mERROR[0m Run qwu4qq1k errored: OSError("Can't load tokenizer for 'EMBEDDIA/sloberta'. Make sure that:\n\n- 'EMBEDDIA/sloberta' is a correct model identifier listed on 'https://huggingface.co/models'\n\n- or 'EMBEDDIA/sloberta' is the correct path to a directory containing relevant tokenizer files\n\n")
[34m[1mwandb[0m: Agent Starting Run: 3hi4lnee with config:
[34m[1mwandb[0m: 	learning_rate: 8.57222802142255e-05
[34m[1mwandb[0m: 	num_train_epochs: 14
[34m[1mwandb[0m: 	train_batch_size: 14
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


You are using a model of type camembert to instantiate a model of type roberta. This is not supported for all configurations of models and can yield errors.
Some weights of the model checkpoint at EMBEDDIA/sloberta were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.bias', 'lm_head.dense.weight', 'lm_head.decoder.bias', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.layer_norm.weight', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification we

VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run 3hi4lnee errored: OSError("Can't load tokenizer for 'EMBEDDIA/sloberta'. Make sure that:\n\n- 'EMBEDDIA/sloberta' is a correct model identifier listed on 'https://huggingface.co/models'\n\n- or 'EMBEDDIA/sloberta' is the correct path to a directory containing relevant tokenizer files\n\n")
[34m[1mwandb[0m: [32m[41mERROR[0m Run 3hi4lnee errored: OSError("Can't load tokenizer for 'EMBEDDIA/sloberta'. Make sure that:\n\n- 'EMBEDDIA/sloberta' is a correct model identifier listed on 'https://huggingface.co/models'\n\n- or 'EMBEDDIA/sloberta' is the correct path to a directory containing relevant tokenizer files\n\n")
[34m[1mwandb[0m: Agent Starting Run: g1tbhqt0 with config:
[34m[1mwandb[0m: 	learning_rate: 9.063901189210694e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 100
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


You are using a model of type camembert to instantiate a model of type roberta. This is not supported for all configurations of models and can yield errors.
Some weights of the model checkpoint at EMBEDDIA/sloberta were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.bias', 'lm_head.dense.weight', 'lm_head.decoder.bias', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.layer_norm.weight', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification we

VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run g1tbhqt0 errored: OSError("Can't load tokenizer for 'EMBEDDIA/sloberta'. Make sure that:\n\n- 'EMBEDDIA/sloberta' is a correct model identifier listed on 'https://huggingface.co/models'\n\n- or 'EMBEDDIA/sloberta' is the correct path to a directory containing relevant tokenizer files\n\n")
[34m[1mwandb[0m: [32m[41mERROR[0m Run g1tbhqt0 errored: OSError("Can't load tokenizer for 'EMBEDDIA/sloberta'. Make sure that:\n\n- 'EMBEDDIA/sloberta' is a correct model identifier listed on 'https://huggingface.co/models'\n\n- or 'EMBEDDIA/sloberta' is the correct path to a directory containing relevant tokenizer files\n\n")
Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: [32m[41mERROR[0m Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: To disable this check set WANDB_AGENT_DISABLE_FLAPPING=true


In [9]:
# Doesen't run, don't know why
model_name = "xlm-roberta-base"
model_type = "xlm-roberta"
language = "sl"

run_hyperparams_optimization(model_name, model_type, language)

Create sweep with ID: xtzzgzuv
Sweep URL: https://wandb.ai/5roop/task3_xlm-roberta-basexlm-roberta/sweeps/xtzzgzuv


[34m[1mwandb[0m: Agent Starting Run: im3ycjw4 with config:
[34m[1mwandb[0m: 	learning_rate: 7.525077012287136e-05
[34m[1mwandb[0m: 	num_train_epochs: 5
[34m[1mwandb[0m: 	train_batch_size: 7
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run im3ycjw4 errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run im3ycjw4 errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: Agent Starting Run: un0yk9nj with config:
[34m[1mwandb[0m: 	learning_rate: 4.909199593792542e-05
[34m[1mwandb[0m: 	num_train_epochs: 20
[34m[1mwandb[0m: 	train_batch_size: 25
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run un0yk9nj errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run un0yk9nj errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: Agent Starting Run: a1lx75od with config:
[34m[1mwandb[0m: 	learning_rate: 1.0999838114011426e-05
[34m[1mwandb[0m: 	num_train_epochs: 12
[34m[1mwandb[0m: 	train_batch_size: 98
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run a1lx75od errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run a1lx75od errored: KeyError('xlm-roberta')
Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: [32m[41mERROR[0m Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: To disable this check set WANDB_AGENT_DISABLE_FLAPPING=true


In [3]:
# Doesen't run, don't know why
model_name = "xlm-roberta-large"
model_type = "xlm-roberta"
language = "sl"

run_hyperparams_optimization(model_name, model_type, language)

Create sweep with ID: ggk3zsph
Sweep URL: https://wandb.ai/5roop/task3_xlm-roberta-largexlm-roberta/sweeps/ggk3zsph


[34m[1mwandb[0m: Agent Starting Run: 7w8r1h5i with config:
[34m[1mwandb[0m: 	learning_rate: 9.901888495782402e-06
[34m[1mwandb[0m: 	num_train_epochs: 19
[34m[1mwandb[0m: 	train_batch_size: 71
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run 7w8r1h5i errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run 7w8r1h5i errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: Agent Starting Run: 5c0aworn with config:
[34m[1mwandb[0m: 	learning_rate: 3.609675069777099e-05
[34m[1mwandb[0m: 	num_train_epochs: 18
[34m[1mwandb[0m: 	train_batch_size: 69
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.0, max=1.0)…

Run 5c0aworn errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run 5c0aworn errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: Agent Starting Run: ln9nvxyx with config:
[34m[1mwandb[0m: 	learning_rate: 8.763866256561414e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 30
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run ln9nvxyx errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run ln9nvxyx errored: KeyError('xlm-roberta')
Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: [32m[41mERROR[0m Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: To disable this check set WANDB_AGENT_DISABLE_FLAPPING=true


In [4]:
# Doesen't run, don't know why
model_name = "xlm-roberta"
model_type = "xlm-roberta"
language = "sl"

run_hyperparams_optimization(model_name, model_type, language)

Create sweep with ID: abego22b
Sweep URL: https://wandb.ai/5roop/task3_xlm-robertaxlm-roberta/sweeps/abego22b


[34m[1mwandb[0m: Agent Starting Run: w869ljxa with config:
[34m[1mwandb[0m: 	learning_rate: 1.8163040630492245e-05
[34m[1mwandb[0m: 	num_train_epochs: 6
[34m[1mwandb[0m: 	train_batch_size: 12
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run w869ljxa errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run w869ljxa errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: Agent Starting Run: d8na1zvk with config:
[34m[1mwandb[0m: 	learning_rate: 1.1651535465097527e-05
[34m[1mwandb[0m: 	num_train_epochs: 4
[34m[1mwandb[0m: 	train_batch_size: 99
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run d8na1zvk errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run d8na1zvk errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: Agent Starting Run: leu1bixn with config:
[34m[1mwandb[0m: 	learning_rate: 7.916020715391716e-05
[34m[1mwandb[0m: 	num_train_epochs: 20
[34m[1mwandb[0m: 	train_batch_size: 100
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

Run leu1bixn errored: KeyError('xlm-roberta')
[34m[1mwandb[0m: [32m[41mERROR[0m Run leu1bixn errored: KeyError('xlm-roberta')
Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: [32m[41mERROR[0m Detected 3 failed runs in the first 60 seconds, killing sweep.
[34m[1mwandb[0m: To disable this check set WANDB_AGENT_DISABLE_FLAPPING=true


In [5]:
model_name = "roberta-base"
model_type = "roberta"
language = "en"

run_hyperparams_optimization(model_name, model_type, language)

Create sweep with ID: u2c0c11r
Sweep URL: https://wandb.ai/5roop/task3_roberta-baseroberta/sweeps/u2c0c11r


[34m[1mwandb[0m: Agent Starting Run: byvzcvl3 with config:
[34m[1mwandb[0m: 	learning_rate: 3.903550621877325e-05
[34m[1mwandb[0m: 	num_train_epochs: 4
[34m[1mwandb[0m: 	train_batch_size: 69
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=4.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 4', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 4', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 4', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 4', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98963008822…

0,1
Training loss,0.17613
lr,0.0
global_step,544.0
_runtime,138.0
_timestamp,1630924519.0
_step,16.0
tp,677.0
tn,1199.0
fp,201.0
fn,225.0


0,1
Training loss,▇▆▆█▇▅▇▄▁▂
lr,█▇▆▆▅▄▃▃▂▁
global_step,▁▂▂▂▃▄▄▅▅▆▆▇▇█
_runtime,▁▂▂▂▃▄▄▄▅▅▆▆▇████
_timestamp,▁▂▂▂▃▄▄▄▅▅▆▆▇████
_step,▁▁▂▂▃▃▄▄▅▅▅▆▆▇▇██
tp,▁▁█▅
tn,▁█▄▇
fp,█▁▅▂
fn,██▁▄


[34m[1mwandb[0m: Agent Starting Run: 8260pa4h with config:
[34m[1mwandb[0m: 	learning_rate: 8.009702232079093e-05
[34m[1mwandb[0m: 	num_train_epochs: 17
[34m[1mwandb[0m: 	train_batch_size: 61
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=17.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 17', max=154.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 17', max=154.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 17', max=154.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 17', max=154.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 17', max=154.0, style=ProgressStyle(d…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 13 of 17', max=154.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 14 of 17', max=154.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 15 of 17', max=154.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 16 of 17', max=154.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.04MB of 0.04MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98274974253…

0,1
Training loss,0.00022
lr,0.0
global_step,2618.0
_runtime,548.0
_timestamp,1630925080.0
_step,73.0
tp,637.0
tn,1156.0
fp,244.0
fn,265.0


0,1
Training loss,▇█▇▆▅▄▄▄▃▃▂▂▁▃▂▂▁▁▂▁▁▁▁▂▁▂▁▁▁▁▂▁▁▁▂▁▂▁▁▁
lr,████▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,▂▃▃▄▂▅▆█▂▅▁▇▅▆▆▅▄▅▅
tn,█▇▇▆▆▄▄▁▇▄█▃▅▄▄▆▅▅▅
fp,▁▂▂▃▃▅▅█▂▅▁▆▅▅▅▃▄▄▄
fn,▇▆▆▅▇▄▃▁▇▄█▂▄▃▃▅▅▄▄


[34m[1mwandb[0m: Agent Starting Run: ne3gahga with config:
[34m[1mwandb[0m: 	learning_rate: 3.430134230784744e-05
[34m[1mwandb[0m: 	num_train_epochs: 5
[34m[1mwandb[0m: 	train_batch_size: 69
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=5.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 5', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 5', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 5', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 5', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 5', max=136.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98956492358…

0,1
Training loss,0.13153
lr,0.0
global_step,680.0
_runtime,170.0
_timestamp,1630925261.0
_step,20.0
tp,667.0
tn,1198.0
fp,202.0
fn,235.0


0,1
Training loss,█▇▆█▇▄▇▄▁▃▁▃▂
lr,█▇▇▆▆▅▅▄▃▃▂▂▁
global_step,▁▂▂▂▃▃▃▄▄▅▅▅▆▆▇▇██
_runtime,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇████
_timestamp,▁▁▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇████
_step,▁▁▂▂▂▃▃▃▄▄▅▅▅▆▆▆▇▇▇██
tp,▄▃▁█▁
tn,▁▄█▂▇
fp,█▅▁▇▂
fn,▅▆█▁█


[34m[1mwandb[0m: Agent Starting Run: 59jwg2iy with config:
[34m[1mwandb[0m: 	learning_rate: 5.150843005614004e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 71
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=132.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=132.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=132.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98981276833…

0,1
Training loss,0.23105
lr,1e-05
global_step,396.0
_runtime,108.0
_timestamp,1630925379.0
_step,12.0
tp,662.0
tn,1183.0
fp,217.0
fn,240.0


0,1
Training loss,█▆▆▆█▁▂
lr,█▇▆▅▃▂▁
global_step,▁▂▃▃▄▅▅▆▇█
_runtime,▁▂▃▃▄▄▅▆▆▇███
_timestamp,▁▂▃▃▄▄▅▆▆▇███
_step,▁▂▂▃▃▄▅▅▆▆▇▇█
tp,█▁▂
tn,▁██
fp,█▁▁
fn,▁█▇


[34m[1mwandb[0m: Agent Starting Run: f88nmowc with config:
[34m[1mwandb[0m: 	learning_rate: 3.369492505681477e-05
[34m[1mwandb[0m: 	num_train_epochs: 4
[34m[1mwandb[0m: 	train_batch_size: 64
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=4.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 4', max=146.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 4', max=146.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 4', max=146.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 4', max=146.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98962804925…

0,1
Training loss,0.20056
lr,0.0
global_step,584.0
_runtime,140.0
_timestamp,1630925529.0
_step,17.0
tp,669.0
tn,1189.0
fp,211.0
fn,233.0


0,1
Training loss,▇▇▄█▅▅▃▅▂▁▃
lr,█▇▇▆▅▅▄▃▂▂▁
global_step,▁▂▂▂▃▄▄▄▅▆▆▆▇██
_runtime,▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
_timestamp,▁▁▂▂▃▃▄▄▅▅▆▆▇▇████
_step,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇██
tp,█▂▆▁
tn,▁▇▅█
fp,█▂▄▁
fn,▁▇▃█


[34m[1mwandb[0m: Agent Starting Run: yh3tku98 with config:
[34m[1mwandb[0m: 	learning_rate: 3.3545833586402316e-05
[34m[1mwandb[0m: 	num_train_epochs: 4
[34m[1mwandb[0m: 	train_batch_size: 76
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=4.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 4', max=123.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 4', max=123.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 4', max=123.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 4', max=123.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98975803354…

0,1
Training loss,0.20341
lr,0.0
global_step,492.0
_runtime,136.0
_timestamp,1630925677.0
_step,15.0
tp,676.0
tn,1192.0
fp,208.0
fn,226.0


0,1
Training loss,█▆▄▅▃▃▁▂▁
lr,█▇▆▅▄▄▃▂▁
global_step,▁▂▂▃▃▄▄▅▆▆▇▇█
_runtime,▁▂▂▃▃▄▄▅▅▆▆▇████
_timestamp,▁▂▂▃▃▄▄▅▅▆▆▇████
_step,▁▁▂▂▃▃▄▄▅▅▆▆▇▇██
tp,█▁▆▃
tn,▁█▅▇
fp,█▁▄▂
fn,▁█▃▆


[34m[1mwandb[0m: Agent Starting Run: 2gtc208r with config:
[34m[1mwandb[0m: 	learning_rate: 3.557077180568143e-05
[34m[1mwandb[0m: 	num_train_epochs: 8
[34m[1mwandb[0m: 	train_batch_size: 86
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=8.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 8', max=109.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.06MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98818886041…

0,1
Training loss,0.07888
lr,0.0
global_step,872.0
_runtime,249.0
_timestamp,1630925937.0
_step,27.0
tp,666.0
tn,1191.0
fp,209.0
fn,236.0


0,1
Training loss,██▅▆▄▄▃▄▂▃▂▁▂▂▁▁▂
lr,██▇▇▆▆▅▅▅▄▄▃▃▂▂▁▁
global_step,▁▁▂▂▂▂▃▃▃▄▄▄▄▅▅▅▆▆▆▇▇▇▇██
_runtime,▁▁▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇█████
_timestamp,▁▁▂▂▂▂▃▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇█████
_step,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
tp,█▄▁▁▇▄▅▂
tn,▁▆█▇▄▆▅▇
fp,█▃▁▂▅▃▄▂
fn,▁▅██▂▅▄▇


[34m[1mwandb[0m: Agent Starting Run: i81zs7p1 with config:
[34m[1mwandb[0m: 	learning_rate: 4.2455263792412026e-05
[34m[1mwandb[0m: 	num_train_epochs: 5
[34m[1mwandb[0m: 	train_batch_size: 75
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=5.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 5', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 5', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 5', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 5', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 5', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98985251481…

0,1
Training loss,0.08077
lr,0.0
global_step,625.0
_runtime,166.0
_timestamp,1630926114.0
_step,19.0
tp,623.0
tn,1222.0
fp,178.0
fn,279.0


0,1
Training loss,▇█▆▆▅▄▅▃▂▁▂▁
lr,█▇▇▆▅▅▄▄▃▂▂▁
global_step,▁▂▂▂▃▃▃▄▅▅▅▆▆▆▇██
_runtime,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇████
_timestamp,▁▁▂▂▃▃▃▄▄▅▅▆▆▆▇▇████
_step,▁▁▂▂▂▃▃▄▄▄▅▅▅▆▆▇▇▇██
tp,▆▅█▇▁
tn,▁▂▃▃█
fp,█▇▆▆▁
fn,▃▄▁▂█


[34m[1mwandb[0m: Agent Starting Run: 67i0lmjb with config:
[34m[1mwandb[0m: 	learning_rate: 2.2587615036824637e-05
[34m[1mwandb[0m: 	num_train_epochs: 10
[34m[1mwandb[0m: 	train_batch_size: 62
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=10.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 10', max=151.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 10', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.06MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98817572554…

0,1
Training loss,0.00809
lr,0.0
global_step,1510.0
_runtime,331.0
_timestamp,1630926458.0
_step,43.0
tp,649.0
tn,1209.0
fp,191.0
fn,253.0


0,1
Training loss,█▇▇▅▆▅▅▄▄▄▃▄▃▄▂▂▂▂▁▁▃▂▂▁▂▂▁▁▁▁
lr,███▇▇▇▇▆▆▆▆▅▅▅▅▄▄▄▄▃▃▃▃▂▂▂▂▁▁▁
global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇▇██
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇█████
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇█████
_step,▁▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,▁▇▂▄█▃▆█▆▅▄
tn,▇▂█▆▁▇▃▂▄▅▆
fp,▂▇▁▃█▂▆▇▅▄▃
fn,█▂▇▅▁▆▃▁▃▄▅


[34m[1mwandb[0m: Agent Starting Run: fkmf9uvl with config:
[34m[1mwandb[0m: 	learning_rate: 6.612444604981019e-06
[34m[1mwandb[0m: 	num_train_epochs: 9
[34m[1mwandb[0m: 	train_batch_size: 12
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=9.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 9', max=779.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 9', max=779.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 9', max=779.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))






HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.05MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98610631687…

0,1
Training loss,0.00675
lr,0.0
global_step,7000.0
_runtime,571.0
_timestamp,1630927041.0
_step,157.0
tp,662.0
tn,1181.0
fp,219.0
fn,240.0


0,1
Training loss,▆▅▄▄▃▃▄▆▄▄▄▃▃▂▂▂▁▁▃▃▄▁▁▂▅▆▂█▁▁▁▁▁▄▁▅▁▁▂▁
lr,███▇▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,▁▆▃█▃▂▆▄▃▂▆▃▄▅▅
tn,▇▄▇▁▇█▅▆▇▇▄▇▆▅▅
fp,▂▅▂█▂▁▄▃▂▂▅▂▃▄▄
fn,█▃▆▁▆▇▃▅▆▇▃▆▅▄▄


[34m[1mwandb[0m: Agent Starting Run: vlr1z3s9 with config:
[34m[1mwandb[0m: 	learning_rate: 2.6939194796761716e-05
[34m[1mwandb[0m: 	num_train_epochs: 12
[34m[1mwandb[0m: 	train_batch_size: 99
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=12.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 12', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 12', max=95.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 12', max=95.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.06MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98805713608…

0,1
Training loss,0.00805
lr,0.0
global_step,1140.0
_runtime,358.0
_timestamp,1630927412.0
_step,37.0
tp,671.0
tn,1167.0
fp,233.0
fn,231.0


0,1
Training loss,█▆▅▅▅▃▅▂▄▂▃▂▃▁▂▁▂▂▁▁▁▁
lr,██▇▇▇▆▆▆▅▅▅▄▄▄▃▃▃▂▂▂▁▁
global_step,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇██
_runtime,▁▁▁▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇█████
_timestamp,▁▁▁▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇█████
_step,▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,▅▅▆▄█▃▄▁▂▅▃▄▄
tn,▃▅▄▆▁▆▅█▇▄▆▅▅
fp,▆▄▅▃█▃▄▁▂▅▃▄▄
fn,▄▄▃▅▁▆▅█▇▄▆▅▅


[34m[1mwandb[0m: Agent Starting Run: p0lgwq8t with config:
[34m[1mwandb[0m: 	learning_rate: 3.4897515763145844e-05
[34m[1mwandb[0m: 	num_train_epochs: 19
[34m[1mwandb[0m: 	train_batch_size: 96
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=19.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 19', max=98.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 19', max=98.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 13 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 14 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 15 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 16 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 17 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 18 of 19', max=98.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.05MB of 0.05MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98439569858…

0,1
Training loss,0.00127
lr,0.0
global_step,1862.0
_runtime,557.0
_timestamp,1630927981.0
_step,59.0
tp,648.0
tn,1195.0
fp,205.0
fn,254.0


0,1
Training loss,███▆▆▄▄▃▂▂▁▂▁▂▁▁▁▁▂▁▁▁▂▁▁▂▁▂▁▁▃▁▁▁▁▁▁
lr,███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,█▇▅▃▇▁▄▂▄▄▃▃▄▄▂▅▃▄▄▄
tn,▁▃▆▇▄█▆▇▆▆▆▇▇▆▇▅▇▆▆▆
fp,█▆▃▂▅▁▃▂▃▃▃▂▂▃▂▄▂▃▃▃
fn,▁▂▄▆▂█▅▇▅▅▆▆▅▅▇▄▆▅▅▅


[34m[1mwandb[0m: Agent Starting Run: atc9l2ln with config:
[34m[1mwandb[0m: 	learning_rate: 9.493338713420705e-05
[34m[1mwandb[0m: 	num_train_epochs: 6
[34m[1mwandb[0m: 	train_batch_size: 25
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=6.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 6', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 6', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 6', max=374.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 6', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 6', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 6', max=374.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.04MB of 0.04MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98220150909…

0,1
Training loss,0.01392
lr,0.0
global_step,2244.0
_runtime,275.0
_timestamp,1630928268.0
_step,54.0
tp,604.0
tn,1173.0
fp,227.0
fn,298.0


0,1
Training loss,██▇▅▇▇▆▅▅▆▆▇▆▄█▄▃▃▄▄▂▇▁▆▄▂▂▃▁▃▁▂▅▁▁▃▃▂▃▁
lr,████▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
_runtime,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
_timestamp,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,▃▁█▄▁▄▄▄
tn,▇█▁▅█▆▆▆
fp,▂▁█▄▁▃▃▃
fn,▆█▁▅█▅▅▅


[34m[1mwandb[0m: Agent Starting Run: bpzf2mnc with config:
[34m[1mwandb[0m: 	learning_rate: 9.925886697944663e-05
[34m[1mwandb[0m: 	num_train_epochs: 4
[34m[1mwandb[0m: 	train_batch_size: 25
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=4.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 4', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 4', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 4', max=374.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 4', max=374.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.82176541717…

0,1
Training loss,0.52019
lr,0.0
global_step,1496.0
_runtime,189.0
_timestamp,1630928468.0
_step,36.0
tp,0.0
tn,1400.0
fp,0.0
fn,902.0


0,1
Training loss,▄▆▇▅▅▇▆▅▅▄▆▆▆▇▆▇█▄▅▆▃▆▆█▃▅▆▅▁
lr,██▇▇▇▇▆▆▆▆▅▅▅▅▄▄▄▄▃▃▃▃▃▂▂▂▂▁▁
global_step,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▆▆▆▆▆▆▇▇▇▇███
_runtime,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
_step,▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇███
tp,▁▁▁▁▁
tn,▁▁▁▁▁
fp,▁▁▁▁▁
fn,▁▁▁▁▁


[34m[1mwandb[0m: Agent Starting Run: 4tjk7jyw with config:
[34m[1mwandb[0m: 	learning_rate: 4.566037959352398e-05
[34m[1mwandb[0m: 	num_train_epochs: 9
[34m[1mwandb[0m: 	train_batch_size: 63
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=9.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 9', max=149.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 9', max=149.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.05MB of 0.05MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98572806516…

0,1
Training loss,0.00031
lr,0.0
global_step,1341.0
_runtime,302.0
_timestamp,1630928782.0
_step,38.0
tp,653.0
tn,1192.0
fp,208.0
fn,249.0


0,1
Training loss,█▅▅▅▃▃▄▃▃▃▃▂▁▂▁▁▁▁▃▁▁▂▂▁▁▁
lr,██▇▇▇▇▆▆▆▅▅▅▅▄▄▄▄▃▃▃▂▂▂▂▁▁
global_step,▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▆▇▇▇▇███
_runtime,▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇█████
_timestamp,▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇█████
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,█▇▃▂▅▄▃▅▁▂
tn,▁▄▆▆▅▆▇▅█▇
fp,█▅▃▃▄▃▂▄▁▂
fn,▁▂▆▇▄▅▆▄█▇


[34m[1mwandb[0m: Agent Starting Run: rus95nb1 with config:
[34m[1mwandb[0m: 	learning_rate: 7.457068925615717e-05
[34m[1mwandb[0m: 	num_train_epochs: 17
[34m[1mwandb[0m: 	train_batch_size: 20
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=17.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 17', max=467.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 17', max=467.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 17', max=467.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 17', max=467.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 17', max=467.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 17', max=467.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 17', max=467.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 17', max=467.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 17', max=467.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 17', max=467.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 17', max=467.0, style=ProgressStyle(d…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))






HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.02MB of 0.02MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.96780386353…

0,1
Training loss,0.29706
lr,3e-05
global_step,5000.0
_runtime,503.0
_timestamp,1630929298.0
_step,117.0
tp,684.0
tn,1075.0
fp,325.0
fn,218.0


0,1
Training loss,▆▄▇▅▅▅▄█▆▃▃▄▆▅▄▇▇▃▇▅▇▅▃▃▅▆▅▃▅▃▃▅▁▃▃▃▂▁▃▄
lr,████▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_runtime,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,▅▇▆▇▇▅▁▄▆▇█▆▆▅█
tn,▆▃▅▄▃▆█▆▄▂▂▄▅▆▁
fp,▃▆▄▅▆▃▁▃▅▇▇▅▄▃█
fn,▄▂▃▂▂▄█▅▃▂▁▃▃▄▁


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: dylqc4re with config:
[34m[1mwandb[0m: 	learning_rate: 3.0187501349081547e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 90
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=104.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=104.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=104.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

0,1
Training loss,0.25782
lr,0.0
global_step,312.0
_runtime,107.0
_timestamp,1630929426.0
_step,11.0
tp,635.0
tn,1223.0
fp,177.0
fn,267.0


0,1
Training loss,▇█▅█▂▁
lr,█▇▅▄▂▁
global_step,▁▂▂▄▅▅▆██
_runtime,▁▂▂▃▄▅▆▇▇███
_timestamp,▁▂▂▃▄▅▆▇▇███
_step,▁▂▂▃▄▄▅▅▆▇▇█
tp,█▆▁
tn,▁▅█
fp,█▄▁
fn,▁▃█


[34m[1mwandb[0m: Agent Starting Run: vqtziq1d with config:
[34m[1mwandb[0m: 	learning_rate: 4.886878579228724e-05
[34m[1mwandb[0m: 	num_train_epochs: 8
[34m[1mwandb[0m: 	train_batch_size: 6
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=8.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 8', max=1557.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 8', max=1557.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 8', max=1557.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))






HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.82129920309…

0,1
Training loss,0.8396
lr,3e-05
global_step,4000.0
_runtime,316.0
_timestamp,1630929753.0
_step,88.0
tp,0.0
tn,1400.0
fp,0.0
fn,902.0


0,1
Training loss,▃▄▅▁▆▂▄▆▆▆▇▅▅▇▆▄▄▇▅▂▆▅█▅▂▅▄▂▅▅▅▃▄▄▅▅▄▁▄▆
lr,███▇▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,▁▁▁▁▁▁
tn,▁▁▁▁▁▁
fp,▁▁▁▁▁▁
fn,▁▁▁▁▁▁


[34m[1mwandb[0m: Agent Starting Run: y8uemgsb with config:
[34m[1mwandb[0m: 	learning_rate: 8.77518070751763e-05
[34m[1mwandb[0m: 	num_train_epochs: 16
[34m[1mwandb[0m: 	train_batch_size: 28
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_p

HBox(children=(FloatProgress(value=0.0, max=9339.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Epoch', max=16.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 16', max=334.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 16', max=334.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 16', max=334.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 16', max=334.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 16', max=334.0, style=ProgressStyle(de…

[34m[1mwandb[0m: Ctrl + C detected. Stopping sweep.
