In [9]:
import pandas as pd
import os
import numpy as np
from datasets import load_dataset, load_metric, set_caching_enabled
from transformers import (
    AutoModelForSequenceClassification,
    AutoTokenizer,
    PrinterCallback,
    Trainer,
    TrainingArguments,
    default_data_collator,
)
from transformers.trainer_utils import set_seed

In [2]:
import wandb

In [3]:
# Search space for the W&B hyperparameter sweep.
# The Bayesian search maximizes "eval/f1"; each key under "parameters" is read
# back from the run config inside training_loop and forwarded to
# TrainingArguments.
#
# No wandb.init() here: every trial opens (and closes) its own run inside
# training_loop, so a run started at this point would only leave an empty,
# never-used run behind.
sweep_config = {
    "name": "my-sweep",
    "method": "bayes",
    "metric": {"name": "eval/f1", "goal": "maximize"},
    "parameters": {
        "learning_rate": {
            "distribution": "uniform",
            "min": 0.0000001,
            "max": 0.00001,
        },
        "num_train_epochs": {
            "distribution": "int_uniform",
            "min": 1,
            "max": 3,
        },
        "per_device_train_batch_size": {
            "distribution": "int_uniform",
            "min": 8,
            "max": 32,
        },
        "weight_decay": {
            "distribution": "uniform",
            "min": 0.005,
            "max": 0.02,
        },
        "warmup_ratio": {
            "distribution": "uniform",
            "min": 0.01,
            "max": 0.1,
        },
    },
}

# Register the sweep; the returned id is what wandb.agent polls for trials.
sweep_id = wandb.sweep(sweep_config)

[34m[1mwandb[0m: Currently logged in as: [33meliottr[0m (use `wandb login --relogin` to force relogin)
2022-04-27 20:04:01.131409: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Create sweep with ID: tjsd3ws1
Sweep URL: https://wandb.ai/eliottr/uncategorized/sweeps/tjsd3ws1


In [4]:
# Checkpoint identifier passed to from_pretrained() for both the model and the tokenizer.
MODEL_NAME = "bert-base-uncased"
# Metric identifier passed to load_metric() and used as metric_for_best_model.
METRIC_NAME = "f1"
# Sets TOKENIZERS_PARALLELISM for this process before any tokenizer is created.
# NOTE(review): presumably meant to disable the tokenizers library's own
# thread pool (and its fork warning) — confirm this is still needed.
os.environ["TOKENIZERS_PARALLELISM"] = "false"

In [5]:
# NOTE(review): BATCH_SIZE is not referenced by any visible cell; the sweep
# supplies per_device_train_batch_size instead — confirm before removing.
BATCH_SIZE = 8
# Parent directory of the fine-tuned model output directory.
MODEL_DIR = "/workspace/models"
# Parent directory of the "tweet-sentiment-extraction" dataset folder.
DATA_DIR = "/workspace/data"
# cache_dir handed to from_pretrained() for model and tokenizer downloads.
CACHE_DIR = "/.cache/huggingface"
# logging_dir handed to TrainingArguments.
LOG_DIR = "/workspace/logs"

In [6]:
def tokenize_fn(example):
    """Tokenize the ``"text"`` column of a dataset batch.

    Used as the callback of ``Dataset.map(..., batched=True)``. Relies on the
    module-level ``tokenizer`` global, which ``training_loop`` assigns before
    mapping.

    Args:
        example: Mapping with a ``"text"`` entry holding the raw text(s).

    Returns:
        Whatever the tokenizer returns for the text, padded and truncated to
        exactly 70 tokens.
    """
    # No model is needed for tokenization; loading one here would re-read the
    # full checkpoint for every mapped batch only to discard it.
    return tokenizer(example["text"], padding="max_length", truncation=True, max_length=70)  # max length 70 for twitter

def compute_metrics(eval_pred):
    """Score one evaluation pass with the metric named by ``METRIC_NAME``.

    Args:
        eval_pred: Pair ``(predictions, labels)``; ``predictions`` holds one
            row of per-class scores per example.

    Returns:
        The result of the metric's ``compute`` call, using weighted averaging
        across classes.
    """
    scorer = load_metric(METRIC_NAME)
    class_scores, gold_labels = eval_pred
    # Collapse per-class scores to the index of the highest-scoring class.
    predicted_ids = np.argmax(class_scores, axis=1)
    return scorer.compute(
        predictions=predicted_ids,
        references=gold_labels,
        average="weighted",
    )


In [7]:
def training_loop():
    """Run one sweep trial: fine-tune ``MODEL_NAME`` on the tweet sentiment CSVs.

    Meant to be passed as the ``function`` argument of ``wandb.agent``. The
    trial's hyperparameters (``learning_rate``, ``num_train_epochs``,
    ``per_device_train_batch_size``, ``warmup_ratio``, ``weight_decay``) are
    read from the config of the W&B run opened here.

    Side effects:
        * Rebinds the module-level ``tokenizer`` (needed by ``tokenize_fn``)
          and ``metric`` globals.
        * Trains, evaluates and saves the model under
          ``{MODEL_DIR}/{MODEL_NAME}-finetuned-tweets``.

    Returns:
        None.
    """
    global tokenizer
    global metric

    with wandb.init() as run:
        # Read hyperparameters from the run opened above rather than from the
        # module-global wandb.config.
        config = run.config

        # Define model and data

        # DATASET = "movies"
        DATASET = "tweets"
        set_caching_enabled(True)
        # Seed before the model is instantiated so every trial starts from the
        # same random state.
        set_seed(42)
        NUM_LABELS = 3
        dataset_raw = load_dataset(
            DATA_DIR + "/tweet-sentiment-extraction",
            data_files={"train": "train_for_fine_tune.csv", "test": "test_for_fine_tune.csv"},
        )
        model = AutoModelForSequenceClassification.from_pretrained(
            MODEL_NAME, num_labels=NUM_LABELS, cache_dir=CACHE_DIR
        )
        tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, cache_dir=CACHE_DIR)
        # NOTE(review): compute_metrics loads its own metric object, so this
        # global is not read by any visible cell — kept in case another cell
        # relies on it.
        metric = load_metric(METRIC_NAME)

        # Prepare the data
        dataset = dataset_raw.map(tokenize_fn, batched=True)
        train_dataset = dataset["train"]
        eval_dataset = dataset["test"]

        # Train and evaluate the model
        # NOTE(review): every trial writes to the same output directory, so
        # each trial overwrites the model saved by the previous one.
        training_args = TrainingArguments(
            f"{MODEL_DIR}/{MODEL_NAME}-finetuned-" + DATASET,
            per_device_train_batch_size=config.per_device_train_batch_size,
            # Evaluation reuses the sampled training batch size.
            per_device_eval_batch_size=config.per_device_train_batch_size,
            learning_rate=config.learning_rate,
            num_train_epochs=config.num_train_epochs,
            logging_dir=LOG_DIR,
            warmup_ratio=config.warmup_ratio,
            weight_decay=config.weight_decay,
            metric_for_best_model=METRIC_NAME,
            evaluation_strategy="steps",
            logging_steps=50,
            #save_steps=50,
            load_best_model_at_end=True
            # lr_scheduler_type='cosine_with_restarts'
        )
        trainer = Trainer(
            model=model,
            args=training_args,
            train_dataset=train_dataset,
            eval_dataset=eval_dataset,
            tokenizer=tokenizer,
            compute_metrics=compute_metrics,
            # optimizers=[AdamW(model.parameters(), lr=2e-5), get_cosine_with_hard_restarts_schedule_with_warmup(optimizer=AdamW(model.parameters(), lr=2e-5), num_warmup_steps=300, num_training_steps=3436, num_cycles=3)]
        )

        trainer.train()
        # Final evaluation pass after training.
        trainer.evaluate()
        trainer.save_model()

In [None]:
# Start a sweep agent in this kernel: it calls training_loop once per trial
# for the sweep registered as sweep_id and stops after 50 trials.
wandb.agent(sweep_id, function=training_loop, count=50)

[34m[1mwandb[0m: Agent Starting Run: pgbqf04v with config:
[34m[1mwandb[0m: 	learning_rate: 6.340994941331681e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 20
[34m[1mwandb[0m: 	warmup_ratio: 0.05049849975627213
[34m[1mwandb[0m: 	weight_decay: 0.016067169519792812
2022-04-27 20:04:12.381465: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.decoder.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.weight']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at

Step,Training Loss,Validation Loss,F1
50,1.1082,1.095607,0.312542
100,1.0933,1.06198,0.433047
150,1.0534,1.00851,0.503555
200,0.9828,0.900186,0.602116
250,0.8794,0.785755,0.670767
300,0.7565,0.681085,0.732422
350,0.7078,0.642355,0.738141
400,0.6395,0.616598,0.751331
450,0.6561,0.595296,0.764201
500,0.614,0.59709,0.756402


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 20
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 20
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 20
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 20
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▆▇█▇█▇████████████████████████████████
eval/loss,█▇▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▄▂▂▃▂▃▄█▄▃▃▃▃▃▃▇▃▄▄▄▄▄▄▄▃▃▄▆▃▄▄▄▃▄▄▄▄▄▄
eval/samples_per_second,█▅▇▇▆▇▆▅▁▅▆▆▆▆▆▆▂▆▄▅▅▅▅▅▅▆▆▅▃▆▅▅▅▆▅▅▅▅▅▅
eval/steps_per_second,█▅▇▇▆▇▆▅▁▅▆▆▆▆▆▆▂▆▄▅▅▅▅▅▅▆▆▅▃▆▅▅▅▆▅▅▅▅▅▅
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃▆███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▆▄▃▃▃▃▂▃▃▂▂▂▂▂▁▁▂▂▁▂▁▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.7951
eval/loss,0.51693
eval/runtime,5.8898
eval/samples_per_second,600.02
eval/steps_per_second,30.052
train/epoch,3.0
train/global_step,4122.0
train/learning_rate,0.0
train/loss,0.4432
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: adkk6dr0 with config:
[34m[1mwandb[0m: 	learning_rate: 1.831443119263844e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 10
[34m[1mwandb[0m: 	warmup_ratio: 0.01960502604771487
[34m[1mwandb[0m: 	weight_decay: 0.019650452308337615
2022-04-27 20:21:00.663377: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.11,1.104203,0.274477
100,1.1035,1.084078,0.36489
150,1.0857,1.067239,0.419955
200,1.0768,1.053738,0.451662
250,1.0622,1.037582,0.471164
300,1.0327,1.01496,0.506948
350,1.0152,0.99885,0.533227
400,0.9902,0.966087,0.528131
450,0.995,0.937247,0.569954
500,0.9396,0.907394,0.575436


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 10
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 10
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 10
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 10
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▄▅▆▇▇▇▇▇▇█████████████████████████████
eval/loss,██▇▆▅▄▄▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▃▃▄▃▃▄▄▂▂▂█▂▂▂▃▁▂▄▁▂▃▂▅▃▃▄▃▄▅▄▂▁▃▂▄▃▄▃▆
eval/samples_per_second,█▆▆▅▆▆▅▅▆▇▇▁▇▇▇▆▇▇▅█▇▆▇▄▆▆▅▆▅▄▅▇█▆▇▅▆▅▆▃
eval/steps_per_second,█▆▆▅▆▆▅▅▆▇▇▁▇▇▇▆▇▇▅█▇▆▇▄▆▆▅▆▅▄▅▇█▆▇▅▆▅▆▃
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▄███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▇▇▅▅▄▄▄▃▄▄▃▃▃▃▃▃▂▂▂▂▃▂▂▃▂▂▂▂▂▂▂▂▂▂▂▁▂▂
train/total_flos,▁

0,1
eval/f1,0.77506
eval/loss,0.56681
eval/runtime,6.3752
eval/samples_per_second,554.337
eval/steps_per_second,55.528
train/epoch,2.0
train/global_step,5496.0
train/learning_rate,0.0
train/loss,0.579
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: vxedv13w with config:
[34m[1mwandb[0m: 	learning_rate: 4.209517912375305e-06
[34m[1mwandb[0m: 	num_train_epochs: 1
[34m[1mwandb[0m: 	per_device_train_batch_size: 17
[34m[1mwandb[0m: 	warmup_ratio: 0.039171741820167194
[34m[1mwandb[0m: 	weight_decay: 0.0057429187590040745
2022-04-27 20:39:58.594960: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1035,1.082274,0.368325
100,1.0719,1.031448,0.482275
150,1.019,0.978162,0.571756
200,0.95,0.89435,0.646219
250,0.8871,0.82241,0.672516
300,0.8246,0.775568,0.687915
350,0.7658,0.722904,0.709282
400,0.7554,0.688513,0.718245
450,0.7033,0.658545,0.731143
500,0.6668,0.637904,0.742153


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▅▆▆▇▇▇▇████████████████████████
eval/loss,█▇▇▅▄▄▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▁▂▂▂▂█▂▃▃▂▂▂▃▂▃▂▂▃▃▃▂▃▂▃▃▃▃▂▃▃▃▅
eval/samples_per_second,██▇▇▇▇▁▇▆▆▇▇▇▆▇▆▇▇▆▆▆▇▆▇▆▆▆▆▇▆▆▆▄
eval/steps_per_second,██▇▇▇▇▁▇▆▆▇▇▇▆▇▆▇▇▆▆▆▇▆▇▆▆▆▆▇▆▆▆▄
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▇▇▇▇▇▇████
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▇▇▇▇▇▇████
train/learning_rate,▇███▇▇▇▇▆▆▆▆▅▅▅▅▄▄▄▄▄▃▃▃▃▂▂▂▂▁▁▁
train/loss,██▇▆▅▄▄▄▃▂▂▂▂▂▂▂▂▂▂▁▂▂▂▂▂▂▁▁▂▁▁▁
train/total_flos,▁

0,1
eval/f1,0.76345
eval/loss,0.57306
eval/runtime,6.2733
eval/samples_per_second,563.343
eval/steps_per_second,33.157
train/epoch,1.0
train/global_step,1617.0
train/learning_rate,0.0
train/loss,0.5844
train/total_flos,988525332698400.0


[34m[1mwandb[0m: Agent Starting Run: 3rg1eo05 with config:
[34m[1mwandb[0m: 	learning_rate: 1.3361077839598998e-06
[34m[1mwandb[0m: 	num_train_epochs: 1
[34m[1mwandb[0m: 	per_device_train_batch_size: 21
[34m[1mwandb[0m: 	warmup_ratio: 0.03999780827110677
[34m[1mwandb[0m: 	weight_decay: 0.01590829122600427
2022-04-27 20:46:47.159316: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1064,1.097227,0.304043
100,1.0902,1.076743,0.395271
150,1.0731,1.059649,0.433491
200,1.06,1.041295,0.456028
250,1.0434,1.022982,0.45257
300,1.033,1.011738,0.456209
350,1.0203,0.986842,0.494751
400,0.9725,0.968425,0.508333
450,0.9669,0.944446,0.505488
500,0.9655,0.924907,0.524708


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▃▄▄▄▄▅▅▅▆▆▆▇▇▇▇█▇████████
eval/loss,██▇▇▆▆▅▅▄▄▄▃▃▃▂▂▂▂▂▁▁▁▁▁▁▁▁
eval/runtime,▁▃▂▁▁▁▃▃▃▄▁▃▃▂▂▂▅▃▃▂▃▃▃█▃▂▂
eval/samples_per_second,█▆▇███▆▆▆▅█▆▆▇▇▇▄▆▆▇▆▆▅▁▆▆▇
eval/steps_per_second,█▆▇███▆▆▆▅█▆▆▇▇▇▄▆▆▇▆▆▅▁▆▆▇
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▇▇▇▇▇▇████
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▇▇▇▇▇▇████
train/learning_rate,███▇▇▇▇▆▆▆▅▅▅▅▄▄▄▃▃▃▂▂▂▂▁▁
train/loss,██▇▇▇▆▆▅▅▅▄▄▃▃▃▂▃▂▂▂▂▁▂▁▁▁
train/total_flos,▁

0,1
eval/f1,0.67482
eval/loss,0.81085
eval/runtime,5.7133
eval/samples_per_second,618.553
eval/steps_per_second,29.58
train/epoch,1.0
train/global_step,1309.0
train/learning_rate,0.0
train/loss,0.8208
train/total_flos,988525332698400.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: d1k38tqj with config:
[34m[1mwandb[0m: 	learning_rate: 7.459411257403022e-07
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 9
[34m[1mwandb[0m: 	warmup_ratio: 0.02884344730004397
[34m[1mwandb[0m: 	weight_decay: 0.01576994972645896
2022-04-27 20:52:32.881701: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1178,1.108986,0.250013
100,1.1033,1.104588,0.269751
150,1.1113,1.096929,0.311158
200,1.086,1.090233,0.346631
250,1.0941,1.080619,0.381067
300,1.0834,1.074741,0.404105
350,1.0676,1.068388,0.411187
400,1.0687,1.063285,0.424525
450,1.0676,1.055563,0.429722
500,1.0655,1.048942,0.439175


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argu

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▂▃▄▄▄▅▅▆▆▇▇▇▇▇▇████████████████████████
eval/loss,██▇▇▇▆▆▆▅▅▄▄▄▃▃▃▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▂▂▃▁▂▂▄▁▃▃▂▆▄▄▃▁█▂▄▂▃▅▆▅▃▂▄▄▁▃▅▂▃▅▅▅▅▅▁
eval/samples_per_second,█▇▇▆█▇▇▅█▆▆▇▃▅▅▆█▁▇▅▇▆▄▃▄▆▇▄▅█▆▄▇▆▄▄▄▄▄█
eval/steps_per_second,█▇▇▆█▇▇▅█▆▆▇▃▅▅▆█▁▇▅▇▆▄▃▄▆▇▄▅█▆▄▇▆▄▄▄▄▄█
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
train/loss,██▇▇▇▆▆▆▅▅▅▄▄▄▄▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▂▁
train/total_flos,▁

0,1
eval/f1,0.74153
eval/loss,0.63616
eval/runtime,6.5423
eval/samples_per_second,540.177
eval/steps_per_second,60.071
train/epoch,2.0
train/global_step,6108.0
train/learning_rate,0.0
train/loss,0.6749
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Agent Starting Run: 6yq3s8r9 with config:
[34m[1mwandb[0m: 	learning_rate: 4.884897966099726e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 27
[34m[1mwandb[0m: 	warmup_ratio: 0.0780993679477932
[34m[1mwandb[0m: 	weight_decay: 0.013225093538967454
2022-04-27 21:13:55.850772: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1132,1.094276,0.323873
100,1.0835,1.058808,0.434881
150,1.041,0.992354,0.461499
200,0.9631,0.884291,0.604797
250,0.8797,0.806252,0.659191
300,0.7782,0.724762,0.715782
350,0.7181,0.670915,0.736031
400,0.684,0.656561,0.734274
450,0.65,0.621756,0.749739
500,0.6047,0.608493,0.755411


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▃▅▆▇▇▇▇█▇█████████████████████████████
eval/loss,██▇▅▄▃▃▃▂▂▂▂▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▂▂▁▃▅▃▃▂▃▂▃▃▃▇▃▃▄▃▂▃▃▅▃▃▄▃▂▃▃▂▃▃▃▃▃▂█▃▃
eval/samples_per_second,█▇▇█▆▄▆▆▇▅▇▆▆▆▂▆▆▅▆▇▆▅▄▆▆▅▆▆▆▆▇▆▆▆▆▆▇▁▆▆
eval/steps_per_second,█▇▇█▆▄▆▆▇▅▇▆▆▆▂▆▆▅▆▇▆▅▄▆▆▅▆▆▆▆▇▆▆▆▆▆▇▁▆▆
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▃▅████▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▇▆▅▄▄▃▃▂▃▃▂▃▂▂▂▂▂▂▁▁▂▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▂
train/total_flos,▁

0,1
eval/f1,0.78108
eval/loss,0.53339
eval/runtime,5.8671
eval/samples_per_second,602.346
eval/steps_per_second,22.328
train/epoch,2.0
train/global_step,2036.0
train/learning_rate,0.0
train/loss,0.5644
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 0nbu0cj6 with config:
[34m[1mwandb[0m: 	learning_rate: 7.067731308485416e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 16
[34m[1mwandb[0m: 	warmup_ratio: 0.05533789415539891
[34m[1mwandb[0m: 	weight_decay: 0.017223270797022638
2022-04-27 21:23:34.351527: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1039,1.093734,0.329838
100,1.0872,1.059183,0.41511
150,1.056,1.010814,0.523738
200,0.9775,0.896946,0.656552
250,0.8457,0.760457,0.71229
300,0.7735,0.682052,0.718927
350,0.7037,0.64253,0.741818
400,0.6655,0.622186,0.745837
450,0.6573,0.60625,0.758592
500,0.6037,0.604603,0.758089


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▂▆▇▇▇██▇███████████████████████████████
eval/loss,██▆▃▃▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▁▃▂▄▁▃▇▃▃▃▃▇▃▄▃▄▃▂▄▃▄▄▃▄▅▄▄█▄▂▄▄▅▄▄▄▄▄▃
eval/samples_per_second,██▆▇▅█▆▂▆▆▆▆▂▆▅▆▅▅▇▅▅▅▅▆▅▄▅▅▁▅▆▅▅▄▅▅▅▅▅▆
eval/steps_per_second,██▆▇▅█▆▂▆▆▆▆▂▆▅▆▅▅▇▅▅▅▅▆▅▄▅▅▁▅▆▅▅▄▅▅▅▅▅▆
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃▅███▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▇▅▄▃▃▃▂▃▃▃▂▃▂▂▂▂▃▂▁▁▂▁▁▁▁▁▁▂▁▂▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79412
eval/loss,0.50941
eval/runtime,5.8561
eval/samples_per_second,603.472
eval/steps_per_second,37.738
train/epoch,2.0
train/global_step,3436.0
train/learning_rate,0.0
train/loss,0.4778
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: ucn2og5g with config:
[34m[1mwandb[0m: 	learning_rate: 6.745413609717602e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 18
[34m[1mwandb[0m: 	warmup_ratio: 0.05604512442645369
[34m[1mwandb[0m: 	weight_decay: 0.0174168727361444
2022-04-27 21:36:47.582630: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1118,1.097173,0.307231
100,1.0957,1.072085,0.400466
150,1.0662,1.030728,0.48681
200,1.0207,0.965035,0.577739
250,0.9376,0.845433,0.658936
300,0.827,0.751379,0.691291
350,0.7476,0.67072,0.727335
400,0.6981,0.637225,0.749691
450,0.6481,0.609788,0.757532
500,0.66,0.59382,0.759619


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▆▇▇██▇████████████████████████████████
eval/loss,█▇▅▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▂▃▃▃▃▃▄▃▄▄▄▄▄▄▃▄▃▃▄▅▃▄▄▃▃▄▅▄▃▄▄▃▄▄█▃▄▃▄
eval/samples_per_second,█▇▆▆▆▆▆▅▆▅▅▅▅▅▅▆▅▆▆▅▄▆▅▅▅▆▅▄▅▆▅▅▆▅▅▁▆▅▆▅
eval/steps_per_second,█▇▆▆▆▆▆▅▆▅▅▅▅▅▅▆▅▆▆▅▄▆▅▅▅▆▅▄▅▆▅▅▆▅▅▁▆▅▆▅
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▂▅████▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▄▄▃▃▃▂▂▃▂▃▂▂▂▂▂▂▂▂▂▁▂▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79611
eval/loss,0.52187
eval/runtime,6.043
eval/samples_per_second,584.81
eval/steps_per_second,32.6
train/epoch,3.0
train/global_step,4581.0
train/learning_rate,0.0
train/loss,0.4621
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: pxnw0vfv with config:
[34m[1mwandb[0m: 	learning_rate: 9.018328700784296e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 13
[34m[1mwandb[0m: 	warmup_ratio: 0.05425467692768531
[34m[1mwandb[0m: 	weight_decay: 0.0142138125444001
2022-04-27 21:55:04.891894: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.0969,1.098272,0.305536
100,1.0926,1.072134,0.404144
150,1.0756,1.04177,0.468694
200,1.0349,0.978495,0.562186
250,0.9455,0.869553,0.661335
300,0.8329,0.776484,0.674271
350,0.8196,0.709,0.692298
400,0.7273,0.658379,0.726923
450,0.6527,0.629732,0.746297
500,0.6687,0.618813,0.745005


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▅▆▇▇▇██████████████████████████████████
eval/loss,█▇▃▂▂▂▁▂▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▂▂▂▁▂▂▁▁▂▂▂▁
eval/runtime,▂▄▂▂▃▃▃▄▂▃▃▃▁█▂▁▂▃▂▂▁▂▄▃▄▂▃▄▁▂▃▃▄▂▂▄▂▂▄█
eval/samples_per_second,▇▅▇▇▆▆▆▅▇▅▆▆█▁▇█▇▆▇▇█▇▅▆▅▇▆▅█▇▆▅▅▇▇▅▇▇▄▁
eval/steps_per_second,▇▅▇▇▆▆▆▅▇▅▆▆█▁▇█▇▆▇▇█▇▅▆▅▇▆▅█▇▆▅▅▇▇▅▇▇▄▁
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▂▅███▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▅▄▄▃▃▃▂▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▂▁▁▂▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.80079
eval/loss,0.52497
eval/runtime,6.3616
eval/samples_per_second,555.521
eval/steps_per_second,42.757
train/epoch,3.0
train/global_step,6342.0
train/learning_rate,0.0
train/loss,0.3789
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: ffbnsspr with config:
[34m[1mwandb[0m: 	learning_rate: 9.039492714858574e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 22
[34m[1mwandb[0m: 	warmup_ratio: 0.07515335370495126
[34m[1mwandb[0m: 	weight_decay: 0.013953418890929535
2022-04-27 22:18:28.443157: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1069,1.093102,0.328439
100,1.0919,1.057577,0.448442
150,1.0437,1.005191,0.497628
200,0.9832,0.883351,0.620364
250,0.8354,0.750027,0.707329
300,0.73,0.658488,0.723202
350,0.6606,0.640073,0.731874
400,0.636,0.585786,0.766606
450,0.6037,0.604809,0.747001
500,0.6032,0.568566,0.768983


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 22
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 22
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 22
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 22
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▅▇▇███████████████████████████████████
eval/loss,██▆▃▂▂▂▂▂▂▂▁▁▂▁▁▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▅▃▅▆▅▄▄▅▄▃▄▆▄▅▅▃▄▆▃▅▆▃▄█▅▅▃▆▆▄▄▃▄▃▆▅▄▄▄
eval/samples_per_second,█▄▆▄▃▄▅▅▄▅▆▅▃▅▄▄▆▅▃▅▄▃▆▅▁▄▃▆▃▃▅▅▆▅▆▃▄▅▅▅
eval/steps_per_second,█▄▆▄▃▄▅▅▄▅▆▅▃▅▄▄▆▅▃▅▄▃▆▅▁▄▃▆▃▃▅▅▆▅▆▃▄▅▅▅
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▂▃▆███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▇▄▄▃▃▃▃▃▃▂▃▃▂▂▁▂▂▂▂▂▂▂▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79801
eval/loss,0.52189
eval/runtime,6.623
eval/samples_per_second,533.595
eval/steps_per_second,24.309
train/epoch,3.0
train/global_step,3750.0
train/learning_rate,0.0
train/loss,0.3691
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: kmcnpgr1 with config:
[34m[1mwandb[0m: 	learning_rate: 9.3386953053127e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 21
[34m[1mwandb[0m: 	warmup_ratio: 0.04160310660485734
[34m[1mwandb[0m: 	weight_decay: 0.01664969329186402
2022-04-27 22:35:46.066860: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1028,1.082577,0.37216
100,1.0684,1.028374,0.50348
150,0.9917,0.899063,0.637488
200,0.8492,0.735387,0.717955
250,0.7306,0.669372,0.725931
300,0.6524,0.625006,0.750279
350,0.6625,0.59681,0.758182
400,0.6143,0.571887,0.771679
450,0.6186,0.566374,0.77154
500,0.5972,0.57003,0.768496


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 21
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▅▇▇▇███████████████████████████████████
eval/loss,█▆▃▂▂▂▁▁▁▁▂▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▂▂▃▁▁▆▂▂▃▂▄▂▂▂▂▂▂▂█▃▂▃▃▂▁▂▃▂▂▂▁▅▃▃▂▂▂▂▃
eval/samples_per_second,█▇▇▆██▃▇▆▆▇▅▇▇▇▆▇▇▇▁▆▇▅▆▇█▇▆▆▇▇█▄▆▆▇▇▆▇▆
eval/steps_per_second,█▇▇▆██▃▇▆▆▇▅▇▇▇▆▇▇▇▁▆▇▅▆▇█▇▆▆▇▇█▄▆▆▇▇▆▇▆
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃▅███▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▄▃▃▃▃▃▃▃▂▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▂▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.80422
eval/loss,0.51144
eval/runtime,5.7689
eval/samples_per_second,612.595
eval/steps_per_second,29.295
train/epoch,3.0
train/global_step,3927.0
train/learning_rate,0.0
train/loss,0.4119
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: y8u2frff with config:
[34m[1mwandb[0m: 	learning_rate: 9.828077271706537e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 13
[34m[1mwandb[0m: 	warmup_ratio: 0.012952487355606376
[34m[1mwandb[0m: 	weight_decay: 0.016366189106043087
2022-04-27 22:51:42.113924: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.087,1.06545,0.418331
100,1.0404,0.969051,0.521171
150,0.9358,0.85097,0.576797
200,0.8273,0.838489,0.594271
250,0.7639,0.693429,0.71947
300,0.6933,0.647055,0.734767
350,0.7157,0.67499,0.710836
400,0.675,0.608232,0.749307
450,0.6163,0.612552,0.747283
500,0.6459,0.598676,0.754649


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 13
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▆▇▇▇█▇███▇▇███████████████████████████
eval/loss,█▅▃▂▂▂▁▂▁▁▁▁▁▁▁▁▂▁▂▁▁▁▁▁▁▁▁▂▂▂▂▁▂▂▁▁▂▂▂▁
eval/runtime,▁▂▃▃▃▃▄▃▃▄▄▄█▅▃▄▃▄█▃▃▅▃▃▄▃▃▅▄▄▄▅▃▄▅▃▅▃█▃
eval/samples_per_second,█▇▆▆▆▆▅▆▆▅▅▅▁▄▆▅▆▄▁▆▆▄▆▆▅▆▆▄▅▅▅▄▆▅▄▆▄▅▁▆
eval/steps_per_second,█▇▆▆▆▆▅▆▆▅▅▅▁▄▆▅▆▄▁▆▆▄▆▆▅▆▆▄▅▅▅▄▆▅▄▆▄▅▁▆
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▅███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
train/loss,█▆▅▄▄▃▃▃▂▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▂▁▁▂▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.80487
eval/loss,0.53887
eval/runtime,6.1811
eval/samples_per_second,571.743
eval/steps_per_second,44.005
train/epoch,3.0
train/global_step,6342.0
train/learning_rate,0.0
train/loss,0.3762
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: vh3th6hz with config:
[34m[1mwandb[0m: 	learning_rate: 8.939890110565372e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 12
[34m[1mwandb[0m: 	warmup_ratio: 0.01779760925759143
[34m[1mwandb[0m: 	weight_decay: 0.019620735960260555
2022-04-27 23:15:11.792590: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1022,1.08098,0.386098
100,1.0642,1.05613,0.388815
150,1.0032,0.943792,0.480749
200,0.8897,0.798167,0.681305
250,0.7356,0.714551,0.671733
300,0.7183,0.649411,0.727319
350,0.7056,0.625576,0.740492
400,0.6878,0.623238,0.739187
450,0.6466,0.599019,0.7549
500,0.593,0.596542,0.758281


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▆▇█████████████████████████████████████
eval/loss,█▅▃▂▂▁▂▁▂▁▁▁▁▁▁▁▂▂▂▂▁▂▁▁▁▁▁▂▁▂▂▂▂▂▂▂▂▂▂▁
eval/runtime,▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁█▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/samples_per_second,████████████████████▁███████████████████
eval/steps_per_second,████████████████████▁███████████████████
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▇███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
train/loss,█▆▄▄▃▄▃▄▃▃▃▃▃▃▃▂▂▂▂▃▂▂▂▂▂▂▃▁▂▁▁▂▂▂▁▁▁▁▁▂
train/total_flos,▁

0,1
eval/f1,0.79782
eval/loss,0.5048
eval/runtime,6.4004
eval/samples_per_second,552.156
eval/steps_per_second,46.091
train/epoch,3.0
train/global_step,6870.0
train/learning_rate,0.0
train/loss,0.3339
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: lxn8t4qi with config:
[34m[1mwandb[0m: 	learning_rate: 9.96240459515764e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 11
[34m[1mwandb[0m: 	warmup_ratio: 0.028794991188710845
[34m[1mwandb[0m: 	weight_decay: 0.01687520407386576
2022-04-27 23:41:20.312812: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.112,1.086702,0.355025
100,1.0617,1.025974,0.461645
150,1.0141,0.931987,0.584657
200,0.8776,0.818456,0.656634
250,0.7561,0.704049,0.718473
300,0.7215,0.654817,0.737616
350,0.6848,0.634653,0.743231
400,0.7297,0.624705,0.748118
450,0.6766,0.60695,0.752882
500,0.6423,0.589314,0.762454


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▅▇▇███▇████████████████████████████████
eval/loss,█▆▃▂▂▂▁▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▂▂▃▂▄▃▂▃▂▂▃▃▄▂▃▄▃▃▃▃▃▂▄▄▃▃▂█▂▃▃▄▃▃▂▂▃▃█
eval/samples_per_second,█▇▇▆▇▅▆▇▆▆▇▆▆▅▇▆▅▆▆▆▆▆▆▅▅▆▆▇▁▆▆▆▅▆▆▇▇▆▆▁
eval/steps_per_second,█▇▇▆▇▅▆▇▆▆▇▆▆▅▇▆▅▆▆▆▆▆▆▅▅▆▆▇▁▆▆▆▅▆▆▇▇▆▆▁
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▄▄▃▃▃▃▃▃▃▃▂▃▃▃▂▂▂▁▁▁▂▂▁▁▁▁▁▂▁▁▁▁▁▂▁▁▁▂
train/total_flos,▁

0,1
eval/f1,0.79753
eval/loss,0.51974
eval/runtime,6.9336
eval/samples_per_second,509.692
eval/steps_per_second,46.441
train/epoch,2.0
train/global_step,4998.0
train/learning_rate,0.0
train/loss,0.4828
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 4dqz6064 with config:
[34m[1mwandb[0m: 	learning_rate: 9.739374396218434e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 29
[34m[1mwandb[0m: 	warmup_ratio: 0.044924916549757846
[34m[1mwandb[0m: 	weight_decay: 0.00670969741446307
2022-04-28 00:00:14.898559: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1039,1.069895,0.417689
100,1.0506,0.986,0.535174
150,0.9246,0.782095,0.702054
200,0.7333,0.657005,0.726144
250,0.6782,0.619531,0.752884
300,0.644,0.58679,0.768395
350,0.6058,0.577178,0.760969
400,0.6015,0.56018,0.778457
450,0.58,0.554326,0.780346
500,0.567,0.554908,0.772289


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 29
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 29
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 29
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 29
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▆▇▇███▇███████████████████████████████
eval/loss,█▇▄▂▂▂▂▁▂▁▁▂▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▁▃▂▄▄▃▄▄▃▄▃▃▄▄▃▄▃▃▃▃▃▃▄▃▄▃▅▄█▄▄▄▄▃▅▃▄▄▆
eval/samples_per_second,██▆▇▅▅▆▅▅▆▅▆▆▅▅▆▅▆▆▆▆▆▆▅▆▅▆▄▅▁▅▅▅▅▆▄▆▅▄▃
eval/steps_per_second,██▆▇▅▅▆▅▅▆▅▆▆▅▅▆▅▆▆▆▆▆▆▅▆▅▆▄▅▁▅▅▅▅▆▄▆▅▄▃
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▄▆███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▆▄▄▃▃▃▃▃▃▂▃▂▂▂▂▂▂▁▂▂▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79606
eval/loss,0.51473
eval/runtime,6.0737
eval/samples_per_second,581.857
eval/steps_per_second,20.087
train/epoch,3.0
train/global_step,2844.0
train/learning_rate,0.0
train/loss,0.4006
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: svd1b1o3 with config:
[34m[1mwandb[0m: 	learning_rate: 8.600787737791735e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 17
[34m[1mwandb[0m: 	warmup_ratio: 0.034674461693173196
[34m[1mwandb[0m: 	weight_decay: 0.006164235104078892
2022-04-28 00:13:32.306799: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1052,1.088298,0.351016
100,1.0785,1.04035,0.471462
150,1.0153,0.947666,0.603146
200,0.8832,0.785028,0.671424
250,0.7843,0.684391,0.731441
300,0.7061,0.636845,0.741881
350,0.6512,0.616124,0.752317
400,0.6575,0.605086,0.753842
450,0.6377,0.587937,0.764206
500,0.5931,0.575207,0.762624


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▅▇▇▇███████████████████████████████████
eval/loss,█▆▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▂▁▁▃▂▃▃▃▂▂▃▂▂█▃▃▃▂▂▂▂▃▃▃▅▂▃▂▃▃▃▂▂▂▄▃▃▃▃▂
eval/samples_per_second,▇██▆▇▆▆▆▇▇▆▇▇▁▆▆▆▆▇▆▇▆▆▆▃▇▆▆▆▆▆▇▇▇▅▆▆▆▆▇
eval/steps_per_second,▇██▆▇▆▆▆▇▇▆▇▇▁▆▆▆▆▇▆▇▆▆▆▃▇▆▆▆▆▆▇▇▇▅▆▆▆▆▇
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃▇███▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▅▄▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▁▂▁▂▂▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79662
eval/loss,0.51324
eval/runtime,6.111
eval/samples_per_second,578.299
eval/steps_per_second,34.037
train/epoch,3.0
train/global_step,4851.0
train/learning_rate,0.0
train/loss,0.3547
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: uqptmdpv with config:
[34m[1mwandb[0m: 	learning_rate: 9.430715197658142e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 12
[34m[1mwandb[0m: 	warmup_ratio: 0.0975721052306532
[34m[1mwandb[0m: 	weight_decay: 0.007009274908742593
2022-04-28 00:32:47.507335: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1081,1.104087,0.273054
100,1.1,1.088614,0.353107
150,1.0852,1.070208,0.416486
200,1.074,1.047406,0.434783
250,1.043,1.005326,0.500838
300,1.0026,0.944572,0.585744
350,0.9204,0.858601,0.654049
400,0.8658,0.800716,0.640072
450,0.7904,0.708735,0.723047
500,0.7055,0.649245,0.740461


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▂▅▇▇█▇█████████████████████████████████
eval/loss,██▅▂▂▂▂▁▁▁▁▁▁▁▁▁▁▂▂▂▁▁▁▁▁▁▁▂▁▂▂▂▂▂▂▂▂▂▂▂
eval/runtime,▂▁▂▂█▂▂▂▂▂▃▂▅▂▂▂▂▂▂▃▄▂▂▂▂▂▂▃▄▂▂▂▂▂▃▂▅▂▂▂
eval/samples_per_second,▇█▇▇▁▇▇▇▇▇▆▇▄▆▇▇▇▇▇▆▅▇▆▇▇▇▇▅▅▇▇▇▇▇▆▇▃▇▆▇
eval/steps_per_second,▇█▇▇▁▇▇▇▇▇▆▇▄▆▇▇▇▇▇▆▅▇▆▇▇▇▇▅▅▇▇▇▇▇▆▇▃▇▆▇
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▂▃▅▇███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▄▄▄▃▄▃▃▃▃▃▃▃▂▂▂▃▃▂▂▂▂▂▂▃▁▂▁▁▂▂▂▁▁▂▁▁▂
train/total_flos,▁

0,1
eval/f1,0.7998
eval/loss,0.54399
eval/runtime,6.3028
eval/samples_per_second,560.705
eval/steps_per_second,46.805
train/epoch,3.0
train/global_step,6870.0
train/learning_rate,0.0
train/loss,0.3285
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: v6tzr5ir with config:
[34m[1mwandb[0m: 	learning_rate: 9.609926705839952e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 11
[34m[1mwandb[0m: 	warmup_ratio: 0.09838013176050524
[34m[1mwandb[0m: 	weight_decay: 0.01973679513149403
2022-04-28 00:58:07.156114: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1176,1.105259,0.270322
100,1.093,1.088687,0.34749
150,1.0968,1.071033,0.412178
200,1.0727,1.047589,0.445696
250,1.0366,1.01488,0.496214
300,1.0066,0.980156,0.561362
350,0.9411,0.881802,0.587222
400,0.9221,0.826881,0.659657
450,0.8284,0.780714,0.668544
500,0.7827,0.713168,0.712217


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▆▆██▇██▇██████████████████████████████
eval/loss,██▅▃▂▂▂▁▂▂▂▁▁▁▁▁▁▂▂▁▂▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▁
eval/runtime,▁▃▃▃▄▄▅▄▄▄▃█▃▅▄▄▂▃▇▄▃▃▄▅▄▃▄▃▃▄▄▄▃▆▃▃▃▄▄▄
eval/samples_per_second,█▅▆▆▅▅▄▅▅▅▆▁▆▄▅▅▆▆▂▅▆▆▅▄▅▆▅▅▆▅▅▅▆▃▆▆▆▅▅▅
eval/steps_per_second,█▅▆▆▅▅▄▅▅▅▆▁▆▄▅▅▆▆▂▅▆▆▅▄▅▆▅▅▆▅▅▅▆▃▆▆▆▅▅▅
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
train/learning_rate,▂▃▅▇███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▅▄▄▃▄▃▃▃▃▃▃▂▂▂▃▂▂▂▃▂▂▃▂▃▁▂▂▁▂▂▂▁▂▂▂▁▂
train/total_flos,▁

0,1
eval/f1,0.79959
eval/loss,0.50992
eval/runtime,6.6947
eval/samples_per_second,527.879
eval/steps_per_second,48.098
train/epoch,3.0
train/global_step,7497.0
train/learning_rate,0.0
train/loss,0.3752
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: oj5nbe6x with config:
[34m[1mwandb[0m: 	learning_rate: 9.684561667950975e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 9
[34m[1mwandb[0m: 	warmup_ratio: 0.09315087732337514
[34m[1mwandb[0m: 	weight_decay: 0.015645776061200413
2022-04-28 01:26:17.729555: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1165,1.104763,0.272145
100,1.0959,1.088369,0.34671
150,1.0911,1.064494,0.417881
200,1.0609,1.046752,0.461434
250,1.0414,1.005529,0.491096
300,0.9867,0.923851,0.61418
350,0.8991,0.848889,0.646758
400,0.8412,0.765451,0.686594
450,0.7623,0.742525,0.65199
500,0.7499,0.68857,0.695087


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 9
The following columns in the evaluation set  don't have a corresponding argu

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▆▇▇█▇▇████████████████████████████████
eval/loss,█▇▅▃▂▂▂▂▂▁▂▁▁▁▂▁▁▁▁▁▂▂▁▁▂▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▁▂▄▂▄▂▅▂▃▃▃▃▄▂▄▅▃▅█▅▅▅▄▄▄▃▅▇▆▅▃▃▄▃▅▅▃▅▃
eval/samples_per_second,██▇▅▇▅▇▄▆▆▆▅▆▄▇▅▄▆▄▁▄▄▄▅▅▅▆▄▂▃▄▅▆▅▆▄▄▆▄▆
eval/steps_per_second,██▇▅▇▅▇▄▆▆▆▅▆▄▇▅▄▆▄▁▄▄▄▅▅▅▆▄▂▃▄▅▆▅▆▄▄▆▄▆
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▂▃▅▇███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▆▅▃▃▃▃▂▃▃▂▃▂▃▃▃▂▂▂▁▁▂▂▂▂▂▂▂▁▂▁▁▁▂▂▁▁▂▁
train/total_flos,▁

0,1
eval/f1,0.80156
eval/loss,0.52556
eval/runtime,6.5645
eval/samples_per_second,538.351
eval/steps_per_second,59.868
train/epoch,2.0
train/global_step,6108.0
train/learning_rate,0.0
train/loss,0.422
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Agent Starting Run: ttjdz89f with config:
[34m[1mwandb[0m: 	learning_rate: 9.912291707766184e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 26
[34m[1mwandb[0m: 	warmup_ratio: 0.0968691677085702
[34m[1mwandb[0m: 	weight_decay: 0.017896753930457126
2022-04-28 01:47:35.860688: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1055,1.084861,0.368607
100,1.0733,1.03562,0.473168
150,0.9904,0.912076,0.571555
200,0.8723,0.769947,0.705692
250,0.7362,0.646636,0.735004
300,0.6612,0.618861,0.741519
350,0.6336,0.579558,0.768195
400,0.6147,0.579795,0.757732
450,0.5698,0.566493,0.769717
500,0.5765,0.546398,0.783366


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 26
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 26
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 26
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 26
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▄▆▇▇█▇████████████████████████████████
eval/loss,█▇▆▄▃▂▂▂▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▂▁▃▃▅▅▃▄▄▄▄▃▂▄▃▄▄█▃▃▂▄▄▄▄▄▃▅▃▄▃▃▄▅▅▄▃▅▂▆
eval/samples_per_second,▇█▆▆▄▄▆▅▅▅▅▆▇▅▆▅▅▁▆▆▆▅▅▅▅▅▆▄▆▅▆▆▄▄▄▅▆▄▆▃
eval/steps_per_second,▇█▆▆▄▄▆▅▅▅▅▆▇▅▆▅▅▁▆▆▆▅▅▅▅▅▆▄▆▅▆▆▄▄▄▅▆▄▆▃
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▃▄▆████▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁
train/loss,██▇▆▄▃▃▃▂▂▂▃▂▃▂▂▂▂▂▂▁▁▂▁▁▁▁▁▁▂▁▁▁▁▁▁▁▁▁▂
train/total_flos,▁

0,1
eval/f1,0.79615
eval/loss,0.52332
eval/runtime,6.0061
eval/samples_per_second,588.4
eval/steps_per_second,22.644
train/epoch,2.0
train/global_step,2114.0
train/learning_rate,0.0
train/loss,0.5043
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: fytl0lhe with config:
[34m[1mwandb[0m: 	learning_rate: 9.259855487778042e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 30
[34m[1mwandb[0m: 	warmup_ratio: 0.09660425700796545
[34m[1mwandb[0m: 	weight_decay: 0.005966513075506588
2022-04-28 01:57:25.248729: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1096,1.089393,0.349011
100,1.075,1.044207,0.439823
150,1.029,0.958784,0.536021
200,0.9172,0.830484,0.67572
250,0.8125,0.711157,0.717425
300,0.7201,0.640621,0.745427
350,0.6438,0.613863,0.745146
400,0.6118,0.609165,0.74481
450,0.5933,0.576213,0.763662
500,0.6187,0.625738,0.733213


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 30
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 30
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 30
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 30
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▂▄▇▇▇▇▇██▇█████████████████████████████
eval/loss,█▇▆▃▃▂▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▁▂▂▁▁▁▁▂▂▁▂▂▂█▂▂▂▂▂▂▂▁▃▂▂▂▂▂▂▄▂▂▂▂▂▂▂▂▂
eval/samples_per_second,██▇▇████▇▇█▇▇▇▁▇▇▇▇▇▇▇█▆▇▇▇▇▇▇▅▇▇▇▇▇▇▇▇▇
eval/steps_per_second,██▇▇████▇▇█▇▇▇▁▇▇▇▇▇▇▇█▆▇▇▇▇▇▇▅▇▇▇▇▇▇▇▇▇
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▂▄▅████▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▇▅▄▄▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▂▁▁▁▁▁▂▁
train/total_flos,▁

0,1
eval/f1,0.79688
eval/loss,0.51348
eval/runtime,6.0086
eval/samples_per_second,588.156
eval/steps_per_second,19.638
train/epoch,3.0
train/global_step,2748.0
train/learning_rate,0.0
train/loss,0.4188
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: 06iktv2u with config:
[34m[1mwandb[0m: 	learning_rate: 9.889686759703528e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 18
[34m[1mwandb[0m: 	warmup_ratio: 0.0863000623867988
[34m[1mwandb[0m: 	weight_decay: 0.009800085364689067
2022-04-28 02:10:31.211499: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1103,1.091957,0.332028
100,1.0892,1.060129,0.434588
150,1.0508,1.00247,0.508225
200,0.9755,0.886947,0.615653
250,0.8615,0.793642,0.64842
300,0.7666,0.679314,0.72477
350,0.6866,0.653137,0.732692
400,0.6721,0.614597,0.758524
450,0.6284,0.59283,0.765838
500,0.6387,0.577924,0.769435


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 18
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▅▆▇▇█▇████████████████████████████████
eval/loss,██▆▄▃▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▂▁▄▃▃▂▂▅▃▃▄▂▁▂▅▅▂▃▂▂▃█▂▂▂▂▂▂▃▂▄▂▃▂▆▄▄▁▂
eval/samples_per_second,█▇█▅▆▆▇▇▄▆▆▅▇█▇▄▄▇▆▇▇▆▁▇▇▇▇▇▇▆▇▅▇▆▇▃▅▅█▇
eval/steps_per_second,█▇█▅▆▆▇▇▄▆▆▅▇█▇▄▄▇▆▇▇▆▁▇▇▇▇▇▇▆▇▅▇▆▇▃▅▅█▇
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▂▄▆████▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁
train/loss,██▇▅▄▄▃▃▂▃▃▃▂▂▃▂▂▂▂▂▂▁▂▁▁▂▂▂▁▂▁▁▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79571
eval/loss,0.53452
eval/runtime,6.0024
eval/samples_per_second,588.764
eval/steps_per_second,32.82
train/epoch,2.0
train/global_step,3054.0
train/learning_rate,0.0
train/loss,0.4607
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: e253ngj9 with config:
[34m[1mwandb[0m: 	learning_rate: 9.8304541282323e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 12
[34m[1mwandb[0m: 	warmup_ratio: 0.015202679880903854
[34m[1mwandb[0m: 	weight_decay: 0.00957195284247123
2022-04-28 02:22:59.604096: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1002,1.073676,0.408029
100,1.0534,1.040652,0.4089
150,0.9599,0.894369,0.528252
200,0.8209,0.731616,0.682861
250,0.679,0.702694,0.675289
300,0.702,0.63738,0.732893
350,0.6977,0.607822,0.750386
400,0.6692,0.610504,0.746586
450,0.6346,0.594572,0.757299
500,0.5847,0.59187,0.765091


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 12
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▆▇▇██▇█████████████████████████████████
eval/loss,█▄▂▂▂▁▂▁▂▁▁▁▁▁▁▁▂▂▂▂▁▂▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▂▁
eval/runtime,▂▁▃▂▄▂▄▂▄▂▇▆▄▂▇▃▄▃▅█▄▃▃▅▃▄▇▃▄▅▄▄▃▆▅▃▂▆▆▆
eval/samples_per_second,▇█▆▇▅▇▅▇▅▇▂▃▄▇▂▆▅▆▄▁▅▆▆▄▆▅▂▆▅▄▅▅▆▃▄▆▇▃▃▃
eval/steps_per_second,▇█▆▇▅▇▅▇▅▇▂▃▄▇▂▆▅▆▄▁▅▆▆▄▆▅▂▆▅▄▅▅▆▃▄▆▇▃▃▃
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,████▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
train/loss,█▆▄▄▄▄▃▄▃▃▃▃▃▃▃▂▂▂▃▃▂▂▂▂▂▂▃▁▂▁▁▂▂▂▁▁▁▁▁▂
train/total_flos,▁

0,1
eval/f1,0.79897
eval/loss,0.50331
eval/runtime,6.3746
eval/samples_per_second,554.384
eval/steps_per_second,46.277
train/epoch,3.0
train/global_step,6870.0
train/learning_rate,0.0
train/loss,0.3211
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: qdp3ulbl with config:
[34m[1mwandb[0m: 	learning_rate: 9.479732198649685e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 16
[34m[1mwandb[0m: 	warmup_ratio: 0.06218110403959236
[34m[1mwandb[0m: 	weight_decay: 0.01906891111675305
2022-04-28 02:48:12.443203: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1045,1.096881,0.311108
100,1.0917,1.068292,0.397859
150,1.0674,1.028081,0.484774
200,1.009,0.953084,0.603285
250,0.9026,0.816077,0.678262
300,0.8306,0.731272,0.685053
350,0.7121,0.651488,0.730149
400,0.6675,0.624519,0.740352
450,0.6617,0.606755,0.757772
500,0.6034,0.596796,0.760079


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 16
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▆▇█▇█▇████████████████████████████████
eval/loss,█▇▄▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▂▂▁▁▁▁▁▁▁▁▁▂▁▁▂▂▁▁▁▁▂▁
eval/runtime,▁▂▂▄▂▅▃▄▅▃▄▆▃▅▇▄▅▃▆▃█▃▄▅▇▅▄▃▄▄▄▄▅▄▅▃▄▃▅▅
eval/samples_per_second,█▇▇▅▇▃▆▅▄▆▅▃▆▄▂▅▄▆▃▆▁▆▅▄▂▄▅▆▅▅▅▅▄▅▄▆▅▅▄▄
eval/steps_per_second,█▇▇▅▇▃▆▅▄▆▅▃▆▄▂▅▄▆▃▆▁▆▅▄▂▄▅▆▅▅▅▅▄▅▄▆▅▅▄▄
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▂▄████▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▄▄▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▂▁▂▂▁▂▁▁▁
train/total_flos,▁

0,1
eval/f1,0.80118
eval/loss,0.53205
eval/runtime,5.8898
eval/samples_per_second,600.017
eval/steps_per_second,37.522
train/epoch,3.0
train/global_step,5154.0
train/learning_rate,0.0
train/loss,0.3321
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: 7ir1f0my with config:
[34m[1mwandb[0m: 	learning_rate: 9.32520795895725e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 27
[34m[1mwandb[0m: 	warmup_ratio: 0.03184874678544275
[34m[1mwandb[0m: 	weight_decay: 0.01936428996225857
2022-04-28 03:07:45.023040: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1053,1.066591,0.418808
100,1.0361,0.946664,0.56447
150,0.8693,0.772916,0.679092
200,0.7658,0.668306,0.7369
250,0.6693,0.625257,0.740017
300,0.6455,0.593119,0.76073
350,0.6277,0.574737,0.772232
400,0.6038,0.570248,0.772047
450,0.5812,0.557937,0.77761
500,0.5436,0.545924,0.78305


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 27
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▇▇▇▇█▇████████████████████████████████
eval/loss,█▇▃▃▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁█▃▂▃▃▂▃▂▅▃▆▃▄▄▃▃▄▃▄▃▄▄▄▃▃▂▃▂▃▃▂▄▂▃▄▄▃▃▃
eval/samples_per_second,█▁▆▇▆▆▇▆▇▄▆▃▅▅▅▆▆▅▆▅▆▅▅▄▆▆▇▆▇▆▆▇▅▇▆▅▅▆▆▆
eval/steps_per_second,█▁▆▇▆▆▇▆▇▄▆▃▅▅▅▆▆▅▆▅▆▅▅▄▆▆▇▆▇▆▆▇▅▇▆▅▅▆▆▆
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▅███▇▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▅▄▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79954
eval/loss,0.49421
eval/runtime,5.8731
eval/samples_per_second,601.728
eval/steps_per_second,22.305
train/epoch,3.0
train/global_step,3054.0
train/learning_rate,0.0
train/loss,0.4013
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: saa8thy5 with config:
[34m[1mwandb[0m: 	learning_rate: 9.086642532152517e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 23
[34m[1mwandb[0m: 	warmup_ratio: 0.0101318078934975
[34m[1mwandb[0m: 	weight_decay: 0.014458637946056951
2022-04-28 03:21:36.675850: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.0844,1.03178,0.473245
100,0.9906,0.886263,0.617636
150,0.8257,0.748403,0.671433
200,0.7386,0.663237,0.727171
250,0.6714,0.646276,0.729799
300,0.6632,0.611872,0.75115
350,0.6286,0.583312,0.762735
400,0.6247,0.57063,0.77586
450,0.5818,0.566665,0.766574
500,0.5994,0.562384,0.76982


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 23
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 23
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 23
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 23
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▆▇▇▇▇▇▇▇██▇███████████████████████████
eval/loss,█▆▃▂▂▂▂▂▂▁▁▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▃▃▃█▄▄▃▃▃▅▄▅▅▄▅▃▇▄▅▄▅▄▃▅▄▄▃▃▃▃▃▅▅▃▃▃▃▃▃
eval/samples_per_second,█▆▆▆▁▅▅▆▆▆▄▅▄▄▅▄▆▂▅▄▅▄▅▆▄▅▅▆▆▆▆▆▄▄▆▆▆▆▅▆
eval/steps_per_second,█▆▆▆▁▅▅▆▆▆▄▅▄▄▅▄▆▂▅▄▅▄▅▆▄▅▅▆▆▆▆▆▄▄▆▆▆▆▅▆
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,███▇▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▂▁▁▁
train/loss,█▇▅▄▄▃▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▁▂▁▁▁▁▂▁▁▁▁▁▂
train/total_flos,▁

0,1
eval/f1,0.79852
eval/loss,0.51654
eval/runtime,6.6418
eval/samples_per_second,532.088
eval/steps_per_second,23.187
train/epoch,3.0
train/global_step,3585.0
train/learning_rate,0.0
train/loss,0.4367
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: rrw6lk70 with config:
[34m[1mwandb[0m: 	learning_rate: 9.994260213703804e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 11
[34m[1mwandb[0m: 	warmup_ratio: 0.06756573499615812
[34m[1mwandb[0m: 	weight_decay: 0.00503673885464899
2022-04-28 03:38:04.404217: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1169,1.102769,0.282082
100,1.0888,1.079172,0.384215
150,1.0882,1.054098,0.438882
200,1.0555,1.020087,0.477747
250,0.9933,0.949455,0.595846
300,0.9387,0.878495,0.649801
350,0.8402,0.780037,0.672194
400,0.8384,0.704586,0.724159
450,0.7376,0.661241,0.729431
500,0.6995,0.622099,0.753065


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 11
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▃▇▇██▇██▇██████████████████████████████
eval/loss,█▇▃▃▂▁▂▁▂▁▁▁▁▁▁▁▁▂▂▁▂▁▁▁▁▁▁▁▂▂▂▂▂▂▂▂▂▂▂▁
eval/runtime,▁▇▃▂▂▃▃▄█▃▃▄▃▄▂▃▄▃▄▄▅▃▄█▄▆▃▃▄▃▃▅▃▄▄▄▃▅▃▂
eval/samples_per_second,█▂▆▇▇▆▆▅▁▆▆▅▆▅▇▆▅▆▅▅▄▆▅▁▅▃▆▆▅▆▆▄▆▅▅▅▆▄▆▇
eval/steps_per_second,█▂▆▇▇▆▆▅▁▆▆▅▆▅▇▆▅▆▅▅▄▆▅▁▅▃▆▆▅▆▆▄▆▅▅▅▆▄▆▇
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
train/global_step,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇███
train/learning_rate,▂▄▇███▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▄▄▃▃▄▃▃▄▃▃▃▂▂▂▃▂▂▂▃▂▂▃▂▃▁▂▂▁▂▂▂▁▂▂▂▁▂
train/total_flos,▁

0,1
eval/f1,0.79946
eval/loss,0.51505
eval/runtime,6.6262
eval/samples_per_second,533.34
eval/steps_per_second,48.595
train/epoch,3.0
train/global_step,7497.0
train/learning_rate,0.0
train/loss,0.3741
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Sweep Agent: Waiting for job.
[34m[1mwandb[0m: Job received.
[34m[1mwandb[0m: Agent Starting Run: hbjad4a8 with config:
[34m[1mwandb[0m: 	learning_rate: 9.485042293629492e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 8
[34m[1mwandb[0m: 	warmup_ratio: 0.09753530955286356
[34m[1mwandb[0m: 	weight_decay: 0.008711860137409115
2022-04-28 04:06:08.562841: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1114,1.105937,0.265571
100,1.0975,1.092935,0.330832
150,1.0983,1.0788,0.367378
200,1.07,1.051086,0.411678
250,1.0774,1.030608,0.48921
300,1.0305,0.987312,0.541452
350,0.9652,0.922078,0.603284
400,0.9172,0.871897,0.652947
450,0.8516,0.808981,0.644547
500,0.7861,0.77067,0.65634


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argu

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▂▆▇▇▇████▇█████████████████████████████
eval/loss,█▇▅▃▂▂▁▂▁▁▂▂▁▁▁▁▁▁▁▁▁▁▁▂▂▁▁▂▁▂▁▁▁▁▁▁▁▁▁▁
eval/runtime,▁▄▄▂▄▄▃▂▄▄▅▄▂▅▃▃▃▅▃▅▄▆█▃▃▄▄▃▄▃▃▃▅▄▅▆▅▃▄▃
eval/samples_per_second,█▅▅▇▅▅▆▇▅▅▄▅▇▄▆▆▆▄▆▄▄▃▁▆▆▅▅▅▅▆▆▆▄▅▄▃▄▆▅▆
eval/steps_per_second,█▅▅▇▅▅▆▇▅▅▄▅▇▄▆▆▆▄▆▄▄▃▁▆▆▅▅▅▅▆▆▆▄▅▄▃▄▆▅▆
train/epoch,▁▁▁▁▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▅▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▂▃▅▇███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▆▅▄▄▄▄▃▃▃▃▂▃▃▃▃▃▃▂▁▂▂▂▂▂▁▂▂▂▁▂▂▁▁▂▂▂▂▂
train/total_flos,▁

0,1
eval/f1,0.79906
eval/loss,0.54773
eval/runtime,7.0391
eval/samples_per_second,502.051
eval/steps_per_second,62.792
train/epoch,2.0
train/global_step,6870.0
train/learning_rate,0.0
train/loss,0.4401
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Agent Starting Run: yiooorms with config:
[34m[1mwandb[0m: 	learning_rate: 9.924254907729883e-06
[34m[1mwandb[0m: 	num_train_epochs: 2
[34m[1mwandb[0m: 	per_device_train_batch_size: 14
[34m[1mwandb[0m: 	warmup_ratio: 0.06683568599979443
[34m[1mwandb[0m: 	weight_decay: 0.01968109060260556
2022-04-28 04:30:55.804752: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1108,1.092831,0.340434
100,1.0851,1.057159,0.434202
150,1.0541,1.013103,0.536075
200,0.9706,0.880632,0.658487
250,0.8639,0.751814,0.691469
300,0.7522,0.65527,0.739702
350,0.705,0.635328,0.739465
400,0.6614,0.601155,0.757512
450,0.6266,0.616118,0.750414
500,0.6419,0.591134,0.765319


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 14
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 14
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 14
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 14
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▄▆▇▇▇██████████████████████████████████
eval/loss,█▇▄▃▂▂▁▂▂▁▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁
eval/runtime,▂▃▃▄▃▂▂▃▂▂▁▃█▂▂▁▂▂▃▂▂▃▂▂▂▃▂▂▂▃▁▂▁▃▄▂▂▂▃▂
eval/samples_per_second,▇▆▆▅▆▇▇▆▇▇█▆▁▇▇█▇▇▆▇▇▆▇▇▇▆▇▇▇▆█▇█▆▅▇▇▇▆▇
eval/steps_per_second,▇▆▆▅▆▇▇▆▇▇█▆▁▇▇█▇▇▆▇▇▆▇▇▇▆▇▇▇▆█▇█▆▅▇▇▇▆▇
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▄▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇████
train/learning_rate,▂▄▆███▇▇▇▇▇▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▄▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,██▇▅▄▃▃▃▃▃▃▃▂▃▃▂▃▂▂▂▂▁▂▂▁▂▂▂▁▁▁▁▁▁▂▂▁▁▂▂
train/total_flos,▁

0,1
eval/f1,0.79872
eval/loss,0.51078
eval/runtime,5.8125
eval/samples_per_second,608.004
eval/steps_per_second,43.527
train/epoch,2.0
train/global_step,3926.0
train/learning_rate,0.0
train/loss,0.4731
train/total_flos,1977050665396800.0


[34m[1mwandb[0m: Agent Starting Run: amnuaim1 with config:
[34m[1mwandb[0m: 	learning_rate: 9.946671407381753e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 17
[34m[1mwandb[0m: 	warmup_ratio: 0.03675389145958507
[34m[1mwandb[0m: 	weight_decay: 0.014297433006695273
2022-04-28 04:45:17.482843: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1046,1.08637,0.357139
100,1.0763,1.035122,0.477285
150,1.0069,0.942968,0.609309
200,0.8649,0.771823,0.665207
250,0.7627,0.65933,0.743029
300,0.6912,0.623253,0.749359
350,0.6389,0.615743,0.755237
400,0.6498,0.594063,0.761149
450,0.6264,0.576042,0.770393
500,0.5816,0.569026,0.764287


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 17
The following columns in the evaluation set  don't have a corresponding 

Saving model checkpoint to /workspace/models/bert-base-uncased-finetuned-tweets
Configuration saved in /workspace/models/bert-base-uncased-finetuned-tweets/config.json
Model weights saved in /workspace/models/bert-base-uncased-finetuned-tweets/pytorch_model.bin
tokenizer config file saved in /workspace/models/bert-base-uncased-finetuned-tweets/tokenizer_config.json
Special tokens file saved in /workspace/models/bert-base-uncased-finetuned-tweets/special_tokens_map.json





VBox(children=(Label(value='0.001 MB of 0.001 MB uploaded (0.000 MB deduped)\r'), FloatProgress(value=1.0, max…

0,1
eval/f1,▁▅▇▇▇███████████████████████████████████
eval/loss,█▆▃▂▂▂▂▂▂▁▁▁▁▁▂▁▁▁▁▂▁▁▁▁▁▁▁▁▂▂▂▁▁▂▁▁▂▁▂▁
eval/runtime,▁▂▂▅▃▃▄▄▄▃▃▄▃▄▄▃▃▃▄▃▃▃█▃▃▄▃▃▃▄▃▃▃▃▃▃▅▄▅▃
eval/samples_per_second,█▇▇▄▆▆▅▄▅▆▆▅▆▅▅▆▆▆▅▆▆▆▁▆▆▅▆▆▆▅▆▆▆▆▆▆▄▅▄▆
eval/steps_per_second,█▇▇▄▆▆▅▄▅▆▆▅▆▅▅▆▆▆▅▆▆▆▁▆▆▅▆▆▆▅▆▆▆▆▆▆▄▅▄▆
train/epoch,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/global_step,▁▁▁▂▂▂▂▂▂▃▃▃▃▃▃▄▄▄▄▄▅▅▅▅▅▆▆▆▆▆▆▇▇▇▇▇▇███
train/learning_rate,▃▇███▇▇▇▇▇▆▆▆▆▆▆▅▅▅▅▅▄▄▄▄▄▃▃▃▃▃▃▂▂▂▂▂▁▁▁
train/loss,█▇▅▄▃▃▃▃▃▃▃▃▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▂▁▁▂▁▂▂▁▁▁▁▁
train/total_flos,▁

0,1
eval/f1,0.79672
eval/loss,0.52707
eval/runtime,6.0973
eval/samples_per_second,579.602
eval/steps_per_second,34.114
train/epoch,3.0
train/global_step,4851.0
train/learning_rate,0.0
train/loss,0.332
train/total_flos,2965575998095200.0


[34m[1mwandb[0m: Agent Starting Run: gx22sq7i with config:
[34m[1mwandb[0m: 	learning_rate: 9.062797917397618e-06
[34m[1mwandb[0m: 	num_train_epochs: 3
[34m[1mwandb[0m: 	per_device_train_batch_size: 8
[34m[1mwandb[0m: 	warmup_ratio: 0.05409031970679112
[34m[1mwandb[0m: 	weight_decay: 0.017924287303923557
2022-04-28 05:04:36.399039: I tensorflow/stream_executor/platform/default/dso_loader.cc:49] Successfully opened dynamic library libcudart.so.10.1


Using custom data configuration tweet-sentiment-extraction-26a05391932e4e2c
Reusing dataset csv (/home/eliott.remmer/.cache/huggingface/datasets/csv/tweet-sentiment-extraction-26a05391932e4e2c/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)


  0%|          | 0/2 [00:00<?, ?it/s]

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /.cache/huggingface/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "_name_or_path": "bert-base-uncased",
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.14.1"

Step,Training Loss,Validation Loss,F1
50,1.1112,1.105306,0.268833
100,1.0968,1.090529,0.340385
150,1.0956,1.075498,0.376286
200,1.0654,1.043034,0.411776
250,1.0699,1.019861,0.509984
300,1.0152,0.971733,0.569244
350,0.9339,0.880465,0.637439
400,0.8702,0.822818,0.671032
450,0.8169,0.754193,0.692009
500,0.7545,0.724408,0.685376


The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argument in `BertForSequenceClassification.forward` and have been ignored: text, textID.
***** Running Evaluation *****
  Num examples = 3534
  Batch size = 8
The following columns in the evaluation set  don't have a corresponding argu