In [1]:
import pandas as pd
import numpy as np
import torch

torch.cuda.empty_cache()

def read_file(fname: str, correct_labels=True) -> pd.DataFrame:
    """Read a headerless, tab-separated file into a ``text``/``labels`` frame.

    The file is parsed as three columns named ``text``, ``labels`` and
    ``role``; the ``role`` column is dropped before returning.

    Args:
        fname: Path of the tab-separated file to load.
        correct_labels: When true, the ``labels`` column is replaced by
            integers: 0 for rows whose label equals ``"Acceptable speech"``
            and 1 for every other row. When false, labels are returned
            exactly as read from the file.

    Returns:
        A DataFrame with the columns ``text`` and ``labels``.
    """
    df = pd.read_table(fname, sep="\t", header=None, names=["text", "labels", "role"])
    if correct_labels:
        # Assign the whole column in one step. Chained indexing such as
        # ``df.labels[mask] = 1`` triggers SettingWithCopyWarning and does not
        # modify ``df`` at all when pandas Copy-on-Write is active. Casting to
        # int also gives the column a numeric dtype instead of ``object``.
        df["labels"] = (df["labels"] != "Acceptable speech").astype(int)

    return df.drop(columns=["role"])


def run_hyperparams_optimization(model_name, model_type, lang, n_runs=50):
    """Run a Weights & Biases Bayesian hyperparameter sweep for a classifier.

    A sweep is created in the W&B project
    ``"task3_" + model_name.replace("/", "_") + model_type`` and an agent then
    executes ``n_runs`` runs. Each run builds a fresh simpletransformers
    ``ClassificationModel``, trains it on ``../data/merged-{lang}.train.tsv``
    and evaluates it on ``../data/merged-{lang}.test.tsv``. The sweep searches
    ``num_train_epochs`` (3-15), ``learning_rate`` (1e-6 to 1e-4) and
    ``train_batch_size`` (5-100), maximizing the metric named ``mcc``.

    Args:
        model_name: Checkpoint name or path passed to ``ClassificationModel``.
        model_type: Model type string passed to ``ClassificationModel``.
        lang: Language code selecting the data files; one of ``"sl"``,
            ``"hr"`` or ``"en"``.
        n_runs: Number of sweep runs the agent executes (default 50).

    Raises:
        AttributeError: If ``lang`` is not a supported language code. The
            exception type is kept as-is so existing callers keep working.
    """
    # Validate first so a bad argument fails before any GPU or network work.
    if lang not in {"sl", "hr", "en"}:
        raise AttributeError(f"Language {lang} is not valid")

    # Third-party dependencies are imported lazily, only once a sweep will run.
    from simpletransformers.classification import ClassificationModel, ClassificationArgs
    import wandb

    torch.cuda.empty_cache()

    # NOTE(review): sweep runs are scored on the *.test.tsv split, so the
    # selected hyperparameters are tuned against the test data. Confirm this is
    # intended, or point eval_file at a separate dev split.
    eval_file, train_file = f"../data/merged-{lang}.test.tsv", f"../data/merged-{lang}.train.tsv"

    model_args = ClassificationArgs()

    # Early stopping: stop when "mcc" (higher is better) has not improved by
    # at least 0.01 for 3 consecutive evaluations.
    model_args.use_early_stopping = True
    model_args.early_stopping_delta = 0.01
    model_args.early_stopping_metric = "mcc"
    model_args.early_stopping_metric_minimize = False
    model_args.early_stopping_patience = 3

    # Evaluation during training.
    model_args.evaluate_during_training = True
    model_args.evaluate_during_training_steps = 1000
    model_args.eval_batch_size = 8

    # Reproducibility, data handling and logging.
    model_args.manual_seed = 4
    model_args.use_multiprocessing = True
    model_args.labels_list = [0, 1]
    model_args.wandb_project = "task3"
    model_args.reprocess_input_data = True

    # Sweep runs are throwaway: reuse the output directory, keep no checkpoints.
    model_args.overwrite_output_dir = True
    model_args.no_save = True

    sweep_config = {
        "method": "bayes",  # grid, random
        "metric": {"name": "mcc", "goal": "maximize"},
        "parameters": {
            "num_train_epochs": {"max": 15, "min": 3},
            "learning_rate": {"min": 1e-6, "max": 1e-4},
            "train_batch_size": {"max": 100, "min": 5},
        },
    }

    sweep_id = wandb.sweep(sweep_config, project="task3_" + model_name.replace("/", "_") + model_type)

    # Load the data once; every sweep run reuses the same frames.
    train_df = read_file(train_file, correct_labels=True)
    eval_df = read_file(eval_file, correct_labels=True)

    def train():
        """Train and evaluate one model using the current sweep run's config."""
        wandb.init()
        try:
            # overwrite_output_dir / no_save are already set on model_args.
            # Assigning them as attributes of the model object (as was done
            # previously) has no effect, so that is not repeated here.
            model = ClassificationModel(
                model_type,
                model_name,
                use_cuda=True,
                args=model_args,
                sweep_config=wandb.config,
            )
            model.train_model(train_df, eval_df=eval_df)
            model.eval_model(eval_df)
        except Exception:
            # Close the run as failed so it is not left open or reported as a
            # success, then let the agent see the original error.
            wandb.finish(exit_code=1)
            raise
        else:
            # wandb.join() is a deprecated alias of wandb.finish().
            wandb.finish()

    wandb.agent(sweep_id, train, count=n_runs)


In [None]:
# Settings for this sweep: the checkpoint to fine-tune, the model type string
# expected by run_hyperparams_optimization, and the language of the data files.
model_name, model_type, language = "xlm-roberta-base", "xlmroberta", "en"

# Start the hyperparameter sweep with the settings above.
run_hyperparams_optimization(
    model_name=model_name,
    model_type=model_type,
    lang=language,
)

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Create sweep with ID: ypeq6ds8
Sweep URL: https://wandb.ai/5roop/task3_xlm-roberta-basexlmroberta/sweeps/ypeq6ds8


[34m[1mwandb[0m: Agent Starting Run: mvqg2hej with config:
[34m[1mwandb[0m: 	learning_rate: 7.831626915734913e-05
[34m[1mwandb[0m: 	num_train_epochs: 13
[34m[1mwandb[0m: 	train_batch_size: 79
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33m5roop[0m (use `wandb login --relogin` to force relogin)


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=13.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 13', max=119.0, style=ProgressStyle(de…

  torch.nn.utils.clip_grad_norm_(





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 13', max=119.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 13', max=119.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 13', max=119.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 13', max=119.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 13', max=119.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.06MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98676050792…

0,1
Training loss,0.00462
lr,0.0
global_step,1547.0
_runtime,443.0
_timestamp,1631632748.0
_step,46.0
tp,613.0
tn,1173.0
fp,227.0
fn,289.0


0,1
Training loss,██▇▅▄▅▅▅▅▃▂▂▃▂▂▁▁▂▁▁▁▁▂▂▁▁▁▁▁▁
lr,▅███▇▇▇▇▆▆▆▆▅▅▅▅▄▄▄▄▃▃▃▃▂▂▂▂▁▁
global_step,▁▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇██
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,█▁▆▃▃▁▃▅▅▄▆▅▄▄
tn,▁█▅▇▇█▇▆▆▇▅▆▇▆
fp,█▁▄▂▂▁▂▃▃▂▄▃▂▃
fn,▁█▃▆▆█▆▄▄▅▃▄▅▅


[34m[1mwandb[0m: Agent Starting Run: s78aio2w with config:
[34m[1mwandb[0m: 	learning_rate: 7.634763102811421e-05
[34m[1mwandb[0m: 	num_train_epochs: 15
[34m[1mwandb[0m: 	train_batch_size: 62
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=15.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 15', max=151.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 15', max=151.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 15', max=151.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 15', max=151.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 15', max=151.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 13 of 15', max=151.0, style=ProgressStyle(d…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 14 of 15', max=151.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.05MB of 0.05MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98471466098…

0,1
Training loss,0.00018
lr,0.0
global_step,2265.0
_runtime,551.0
_timestamp,1631633311.0
_step,64.0
tp,636.0
tn,1142.0
fp,258.0
fn,266.0


0,1
Training loss,██▇▆▆▆▅▆▄▅▃▄▃▃▃▃▃▂▁▂▁▂▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁
lr,▅████▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,█▁▆▃▃▅▄▃▅▅▅▅▄▄▄▅▅
tn,▁█▅█▇▆▇▇▆▆▆▆▇▇▇▆▆
fp,█▁▄▁▂▃▂▂▃▃▃▃▂▂▂▃▃
fn,▁█▃▆▆▄▅▆▄▄▄▄▅▅▅▄▄


[34m[1mwandb[0m: Agent Starting Run: hdzti2j9 with config:
[34m[1mwandb[0m: 	learning_rate: 4.4324890522344835e-05
[34m[1mwandb[0m: 	num_train_epochs: 13
[34m[1mwandb[0m: 	train_batch_size: 73
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=13.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 13', max=128.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 13', max=128.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 13', max=128.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 13', max=128.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 13', max=128.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.06MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98813809383…

0,1
Training loss,0.0821
lr,0.0
global_step,1664.0
_runtime,454.0
_timestamp,1631633776.0
_step,49.0
tp,636.0
tn,1147.0
fp,253.0
fn,266.0


0,1
Training loss,██▆█▆▆▆▄▅▅▄▄▃▂▄▃▂▁▄▂▂▁▁▁▁▁▁▃▁▂▂▁▂
lr,▅███▇▇▇▇▆▆▆▆▆▅▅▅▅▄▄▄▄▃▃▃▃▃▂▂▂▂▁▁▁
global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
tp,██▅▁▄▁▇▄▅▂▅▄▃▄
tn,▁▁▅█▆▇▄▆▅▇▅▆▆▅
fp,██▄▁▃▂▅▃▄▂▄▃▃▄
fn,▁▁▄█▅█▂▅▄▇▄▅▆▅


[34m[1mwandb[0m: Agent Starting Run: c9ox7bgv with config:
[34m[1mwandb[0m: 	learning_rate: 1.9998729905462498e-05
[34m[1mwandb[0m: 	num_train_epochs: 14
[34m[1mwandb[0m: 	train_batch_size: 25
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=14.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 14', max=374.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 14', max=374.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 14', max=374.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 14', max=374.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 14', max=374.0, style=ProgressStyle(d…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 14', max=374.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 14', max=374.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 13 of 14', max=374.0, style=ProgressStyle(d…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))






HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.06MB of 0.06MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98649648538…

0,1
Training loss,0.00077
lr,0.0
global_step,5000.0
_runtime,687.0
_timestamp,1631634475.0
_step,120.0
tp,604.0
tn,1164.0
fp,236.0
fn,298.0


0,1
Training loss,██▇▅▃█▆▄▄▂▃▇▃▄▃▂▄▂▁▄▃▁▁▂▁▁▁▁▅▁▁▁▁▃▁▁▁▁▂▁
lr,▅███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
_runtime,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
_timestamp,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,█▁▅▇█▃▇▃▂▄▇▂▄▄▃▄▄▃
tn,▁█▅▂▃▇▃▇▇▆▄▇▆▆▇▆▆▇
fp,█▁▄▇▆▂▆▂▂▃▅▂▃▃▂▃▃▂
fn,▁█▄▂▁▆▂▆▇▅▂▇▅▅▆▅▅▆


[34m[1mwandb[0m: Agent Starting Run: km9g304l with config:
[34m[1mwandb[0m: 	learning_rate: 4.743363596039793e-05
[34m[1mwandb[0m: 	num_train_epochs: 13
[34m[1mwandb[0m: 	train_batch_size: 95
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=13.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 13', max=99.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 13', max=99.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 13', max=99.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 13', max=99.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98886881600…

0,1
Training loss,0.06832
lr,0.0
global_step,1287.0
_runtime,431.0
_timestamp,1631634918.0
_step,41.0
tp,621.0
tn,1175.0
fp,225.0
fn,281.0


0,1
Training loss,█▇▆▅▅▄▅▃▂▂▂▂▂▂▂▂▂▁▃▁▁▁▁▁▂
lr,▅██▇▇▇▆▆▆▆▅▅▅▄▄▄▃▃▃▃▂▂▂▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇████
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇██
tp,▆▇█▁▃▂▇▃▆▅▅▅▄▄
tn,▂▃▁█▆█▄▇▅▆▆▆▆▆
fp,▇▆█▁▃▁▅▂▄▃▃▃▃▃
fn,▃▂▁█▆▇▂▆▃▄▄▄▅▅


[34m[1mwandb[0m: Agent Starting Run: aq1f9ak0 with config:
[34m[1mwandb[0m: 	learning_rate: 4.2532382925377725e-05
[34m[1mwandb[0m: 	num_train_epochs: 10
[34m[1mwandb[0m: 	train_batch_size: 100
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=10.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 10', max=94.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98868657304…

0,1
Training loss,0.07321
lr,0.0
global_step,940.0
_runtime,327.0
_timestamp,1631635256.0
_step,30.0
tp,599.0
tn,1175.0
fp,225.0
fn,303.0


0,1
Training loss,█▇▆▅▇▅▅▃▃▂▃▂▂▁▂▁▁▁
lr,▅██▇▇▆▆▅▅▄▄▄▃▃▂▂▁▁
global_step,▁▁▁▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇▇██
_runtime,▁▁▁▂▂▂▂▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▆▇▇▇▇████
_timestamp,▁▁▁▂▂▂▂▃▃▃▄▄▄▄▄▅▅▅▆▆▆▆▆▇▇▇▇████
_step,▁▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▅▆▆▆▆▇▇▇▇███
tp,█▁▅▁▂▄▃▄▃▃
tn,▁█▆█▇▇▇▆▇▇
fp,█▁▃▁▂▂▂▃▂▂
fn,▁█▄█▇▅▆▅▆▆


[34m[1mwandb[0m: Agent Starting Run: mhjjvzbj with config:
[34m[1mwandb[0m: 	learning_rate: 6.883214982532322e-05
[34m[1mwandb[0m: 	num_train_epochs: 8
[34m[1mwandb[0m: 	train_batch_size: 75
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=8.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 8', max=125.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 8', max=125.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98891730605…

0,1
Training loss,0.01607
lr,0.0
global_step,1000.0
_runtime,290.0
_timestamp,1631635557.0
_step,31.0
tp,609.0
tn,1184.0
fp,216.0
fn,293.0


0,1
Training loss,█▆▇█▆▅▆▄▇▆▅▄▄▄▃▁▂▁▂▁
lr,▅██▇▇▆▆▆▅▅▅▄▄▃▃▃▂▂▁▁
global_step,▁▁▂▂▂▂▂▃▃▃▄▄▄▄▅▅▅▅▆▆▆▇▇▇▇████
_runtime,▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇█████
_timestamp,▁▁▂▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇█████
_step,▁▁▁▂▂▂▂▃▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▆▇▇▇▇███
tp,▆▁█▄▆▅▆▆▆
tn,▄█▁▇▄▅▄▅▅
fp,▅▁█▂▅▄▅▄▄
fn,▃█▁▅▃▄▃▃▃


[34m[1mwandb[0m: Agent Starting Run: 6rmwouo1 with config:
[34m[1mwandb[0m: 	learning_rate: 1.9789497644198483e-06
[34m[1mwandb[0m: 	num_train_epochs: 15
[34m[1mwandb[0m: 	train_batch_size: 48
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=15.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 15', max=195.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 15', max=195.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 10 of 15', max=195.0, style=ProgressStyle(d…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 11 of 15', max=195.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 12 of 15', max=195.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 13 of 15', max=195.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 14 of 15', max=195.0, style=ProgressStyle(d…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.08MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.99006941528…

0,1
Training loss,0.58752
lr,0.0
global_step,2925.0
_runtime,590.0
_timestamp,1631636158.0
_step,77.0
tp,631.0
tn,1148.0
fp,252.0
fn,271.0


0,1
Training loss,██▆▆█▇▆▅█▅▄▅▆▂▅▄▆▅▄▄▃▆▄▄▄▄▃▂▅▁▇▃▄▂▅▄▃▃▄▆
lr,▅████▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▆▇▇▇▇▇███
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇████
_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,▁▅▆▇▇█▇██▇███████
tn,█▅▄▃▃▂▃▁▁▃▂▂▁▂▂▃▂
fp,▁▄▅▆▆▇▆██▆▇▇█▇▇▆▇
fn,█▄▃▂▂▁▂▁▁▂▁▁▁▁▁▁▁


[34m[1mwandb[0m: Agent Starting Run: dei5xdlv with config:
[34m[1mwandb[0m: 	learning_rate: 3.5898006758946255e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 68
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=138.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=138.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=138.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.08MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

0,1
Training loss,0.46587
lr,0.0
global_step,414.0
_runtime,122.0
_timestamp,1631636293.0
_step,13.0
tp,660.0
tn,1154.0
fp,246.0
fn,242.0


0,1
Training loss,█▆▄▂▆▁▂▃
lr,▅█▇▆▅▃▂▁
global_step,▁▂▃▃▄▅▅▆▇██
_runtime,▁▂▃▃▄▄▅▅▆▇████
_timestamp,▁▂▃▃▄▄▅▅▆▇████
_step,▁▂▂▃▃▄▄▅▅▆▆▇▇█
tp,█▄▁
tn,▁▆█
fp,█▃▁
fn,▁▅█


[34m[1mwandb[0m: Agent Starting Run: lprl5eq1 with config:
[34m[1mwandb[0m: 	learning_rate: 9.677742308897944e-05
[34m[1mwandb[0m: 	num_train_epochs: 10
[34m[1mwandb[0m: 	train_batch_size: 22
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=10.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 10', max=425.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 10', max=425.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 10', max=425.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 10', max=425.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 10', max=425.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 10', max=425.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 10', max=425.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 7 of 10', max=425.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 8 of 10', max=425.0, style=ProgressStyle(de…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 9 of 10', max=425.0, style=ProgressStyle(de…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))






HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.00MB of 0.00MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.82168614772…

0,1
Training loss,0.62055
lr,1e-05
global_step,4000.0
_runtime,515.0
_timestamp,1631636821.0
_step,95.0
tp,0.0
tn,1400.0
fp,0.0
fn,902.0


0,1
Training loss,▆▅█▆▂▂▅▆█▁▂▄▂▄█▂▅▆▇▆▄▇▁▃▆▅▇▆▅▂▄▇▆▅▅▆▇▂▆▃
lr,▅███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
_runtime,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
_timestamp,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
tp,▁▁▁▁▁▁▁▁▁▁▁▁▁
tn,▁▁▁▁▁▁▁▁▁▁▁▁▁
fp,▁▁▁▁▁▁▁▁▁▁▁▁▁
fn,▁▁▁▁▁▁▁▁▁▁▁▁▁


[34m[1mwandb[0m: Agent Starting Run: pp7i6v6u with config:
[34m[1mwandb[0m: 	learning_rate: 5.0437877383530234e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 98
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98982661004…

0,1
Training loss,0.40803
lr,1e-05
global_step,288.0
_runtime,114.0
_timestamp,1631636947.0
_step,10.0
tp,656.0
tn,1155.0
fp,245.0
fn,246.0


0,1
Training loss,█▆▇▂▁
lr,▄█▆▃▁
global_step,▁▂▂▄▅▅▇█
_runtime,▁▂▃▄▅▅▆▇███
_timestamp,▁▂▃▄▅▅▆▇███
_step,▁▂▂▃▄▅▅▆▇▇█
tp,█▆▁
tn,▁▄█
fp,█▅▁
fn,▁▃█


[34m[1mwandb[0m: Agent Starting Run: kjrjnqge with config:
[34m[1mwandb[0m: 	learning_rate: 6.407958942042518e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 98
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.08MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

0,1
Training loss,0.57498
lr,0.0
global_step,288.0
_runtime,114.0
_timestamp,1631637072.0
_step,10.0
tp,540.0
tn,1174.0
fp,226.0
fn,362.0


0,1
Training loss,▆█▆▁▁
lr,▄█▆▃▁
global_step,▁▂▂▄▅▅▇█
_runtime,▁▂▃▄▅▅▆▇███
_timestamp,▁▂▃▄▅▅▆▇███
_step,▁▂▂▃▄▅▅▆▇▇█
tp,▁▆█
tn,█▄▁
fp,▁▅█
fn,█▃▁


[34m[1mwandb[0m: Agent Starting Run: ym5sl6uk with config:
[34m[1mwandb[0m: 	learning_rate: 9.695278202270423e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 99
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=95.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=95.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=95.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.08MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

0,1
Training loss,0.41213
lr,2e-05
global_step,285.0
_runtime,115.0
_timestamp,1631637198.0
_step,10.0
tp,679.0
tn,1135.0
fp,265.0
fn,223.0


0,1
Training loss,█▇▆▁▂
lr,▄█▆▃▁
global_step,▁▂▂▄▅▅▇█
_runtime,▁▂▃▄▅▅▆▇███
_timestamp,▁▂▃▄▅▅▆▇███
_step,▁▂▂▃▄▅▅▆▇▇█
tp,█▁▄
tn,▁█▇
fp,█▁▂
fn,▁█▅


[34m[1mwandb[0m: Agent Starting Run: oex6etrs with config:
[34m[1mwandb[0m: 	learning_rate: 7.403105630986895e-05
[34m[1mwandb[0m: 	num_train_epochs: 7
[34m[1mwandb[0m: 	train_batch_size: 98
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=7.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 3 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 4 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 5 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 6 of 7', max=96.0, style=ProgressStyle(desc…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=1.0, max=1.0)…

0,1
Training loss,0.08008
lr,0.0
global_step,672.0
_runtime,238.0
_timestamp,1631637446.0
_step,22.0
tp,619.0
tn,1175.0
fp,225.0
fn,283.0


0,1
Training loss,▇▆██▇▄▆▄▆▃▃▂▁
lr,▅█▇▇▆▅▅▄▄▃▂▂▁
global_step,▁▂▂▂▃▃▃▄▄▄▅▅▆▆▆▇▇▇██
_runtime,▁▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇████
_timestamp,▁▂▂▂▃▃▃▄▄▄▅▅▅▆▆▆▇▇▇████
_step,▁▁▂▂▂▃▃▃▄▄▄▅▅▅▅▆▆▆▇▇▇██
tp,▆▁█▂▅▅▅
tn,▂█▁█▆▆▆
fp,▇▁█▁▃▃▃
fn,▃█▁▇▄▄▄


[34m[1mwandb[0m: Agent Starting Run: k0bd3x9a with config:
[34m[1mwandb[0m: 	learning_rate: 8.084645324142018e-05
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 84
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=112.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=112.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=112.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.07MB of 0.07MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.98953174540…

0,1
Training loss,0.36858
lr,1e-05
global_step,336.0
_runtime,118.0
_timestamp,1631637574.0
_step,11.0
tp,659.0
tn,1131.0
fp,269.0
fn,243.0


0,1
Training loss,█▆▃▆▁▁
lr,▄█▆▅▃▁
global_step,▁▂▃▃▅▅▆▇█
_runtime,▁▂▃▃▄▅▅▆▇███
_timestamp,▁▂▃▃▄▅▅▆▇███
_step,▁▂▂▃▄▄▅▅▆▇▇█
tp,█▅▁
tn,▁▆█
fp,█▃▁
fn,▁▄█


[34m[1mwandb[0m: Agent Starting Run: h7h3uzhu with config:
[34m[1mwandb[0m: 	learning_rate: 4.567392896324436e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	train_batch_size: 26
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=3.0, style=ProgressStyle(description_width='i…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 3', max=360.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 3', max=360.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 3', max=360.0, style=ProgressStyle(des…

HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))





HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Evaluation', max=288.0, style=ProgressStyle(descr…




VBox(children=(Label(value=' 0.08MB of 0.08MB uploaded (0.00MB deduped)\r'), FloatProgress(value=0.99021021755…

0,1
Training loss,0.50093
lr,0.0
global_step,1080.0
_runtime,170.0
_timestamp,1631637755.0
_step,27.0
tp,625.0
tn,1138.0
fp,262.0
fn,277.0


0,1
Training loss,▇▆▇▅▅█▇█▅▇▅▅▄▄▃▃▅▂▃▁▄
lr,▅██▇▇▇▆▆▅▅▅▄▄▄▃▃▂▂▂▁▁
global_step,▁▁▂▂▂▃▃▃▃▄▄▄▅▅▅▆▆▆▆▇▇▇▇██
_runtime,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▆▆▆▆▇▇▇████
_timestamp,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▆▆▆▆▇▇▇████
_step,▁▁▂▂▂▂▃▃▃▃▄▄▄▄▅▅▅▅▆▆▆▆▇▇▇▇██
tp,█▁▅▄
tn,▁███
fp,█▁▁▁
fn,▁█▅▅


[34m[1mwandb[0m: Agent Starting Run: 8ams3tue with config:
[34m[1mwandb[0m: 	learning_rate: 9.659378022083072e-05
[34m[1mwandb[0m: 	num_train_epochs: 15
[34m[1mwandb[0m: 	train_batch_size: 99
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.


Some weights of the model checkpoint at xlm-roberta-base were not used when initializing XLMRobertaForSequenceClassification: ['lm_head.layer_norm.weight', 'lm_head.dense.bias', 'lm_head.decoder.weight', 'lm_head.layer_norm.bias', 'lm_head.bias', 'lm_head.dense.weight']
- This IS expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing XLMRobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of XLMRobertaForSequenceClassification were not initialized from the model checkpoint at xlm-roberta-base and are newly initialized: ['classifier.out_proj.bias', 'classifier.dense.weight', 'classifier.dense.bias

HBox(children=(FloatProgress(value=0.0, description='Epoch', max=15.0, style=ProgressStyle(description_width='…

HBox(children=(FloatProgress(value=0.0, description='Running Epoch 0 of 15', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 1 of 15', max=95.0, style=ProgressStyle(des…




HBox(children=(FloatProgress(value=0.0, max=2302.0), HTML(value='')))




HBox(children=(FloatProgress(value=0.0, description='Running Epoch 2 of 15', max=95.0, style=ProgressStyle(des…

In [None]:
# Sweep target: the XLM-RoBERTa large checkpoint, loaded through the
# "xlmroberta" model type, on the English ("en") data split.
model_name, model_type, language = "xlm-roberta-large", "xlmroberta", "en"

# The helper derives the train/test TSV paths from the language code and
# registers the W&B sweep under a project name built from model_name + model_type.
run_hyperparams_optimization(model_name=model_name, model_type=model_type, lang=language)

In [None]:
# Sweep target: the DistilRoBERTa base checkpoint, loaded through the
# "roberta" model type, on the English ("en") data split.
model_name, model_type, language = "distilroberta-base", "roberta", "en"

# The helper derives the train/test TSV paths from the language code and
# registers the W&B sweep under a project name built from model_name + model_type.
run_hyperparams_optimization(model_name=model_name, model_type=model_type, lang=language)

In [None]:
# Sweep target: the RoBERTa base checkpoint, loaded through the
# "roberta" model type, on the English ("en") data split.
model_name, model_type, language = "roberta-base", "roberta", "en"

# The helper derives the train/test TSV paths from the language code and
# registers the W&B sweep under a project name built from model_name + model_type.
run_hyperparams_optimization(model_name=model_name, model_type=model_type, lang=language)