<h1>Table of Contents<span class="tocSkip"></span></h1>
<div class="toc"><ul class="toc-item"><li><span><a href="#imports-and-functions" data-toc-modified-id="imports-and-functions-1"><span class="toc-item-num">1&nbsp;&nbsp;</span>imports and functions</a></span></li><li><span><a href="#experiments" data-toc-modified-id="experiments-2"><span class="toc-item-num">2&nbsp;&nbsp;</span>experiments</a></span><ul class="toc-item"><li><span><a href="#17" data-toc-modified-id="17-2.1"><span class="toc-item-num">2.1&nbsp;&nbsp;</span>17</a></span></li><li><span><a href="#18" data-toc-modified-id="18-2.2"><span class="toc-item-num">2.2&nbsp;&nbsp;</span>18</a></span></li><li><span><a href="#19" data-toc-modified-id="19-2.3"><span class="toc-item-num">2.3&nbsp;&nbsp;</span>19</a></span></li><li><span><a href="#20" data-toc-modified-id="20-2.4"><span class="toc-item-num">2.4&nbsp;&nbsp;</span>20</a></span></li><li><span><a href="#21" data-toc-modified-id="21-2.5"><span class="toc-item-num">2.5&nbsp;&nbsp;</span>21</a></span></li></ul></li></ul></div>

# imports and functions

In [None]:
import collections
import pandas as pd
import os
import sys
import json
import matplotlib.pyplot as plt
from tqdm.auto import tqdm, trange

import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import Dataset, DataLoader
from torch import optim
from torch.optim import lr_scheduler
# import torchmetrics

import datasets
from datasets import load_metric
from transformers import AutoConfig, AutoTokenizer, BertModel, RobertaModel
from transformers import BertForSequenceClassification
from transformers import TrainingArguments, Trainer

from sklearn.metrics import mean_squared_error, accuracy_score, precision_recall_fscore_support


In [None]:
# Explicitly set the TOKENIZERS_PARALLELISM environment variable.
# Background on this setting: https://github.com/huggingface/transformers/issues/5486
# Alternative value, kept for reference:
# os.environ["TOKENIZERS_PARALLELISM"] = "false"
os.environ["TOKENIZERS_PARALLELISM"] = "true"

In [None]:
# Use the GPU when PyTorch can see one, otherwise fall back to the CPU.
device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
device

device(type='cuda')

In [None]:
# Task registry: maps each task name to its number of labels
# (train_baseline reads it as `num_labels = tasks[task]`).
with open('../../data/xslue/tasks.json', 'r') as tasks_file:
    tasks = json.loads(tasks_file.read())
tasks

{'CrowdFlower': 13,
 'DailyDialog': 7,
 'EmoBank_Valence': 1,
 'EmoBank_Arousal': 1,
 'EmoBank_Dominance': 1,
 'HateOffensive': 3,
 'PASTEL_age': 8,
 'PASTEL_country': 2,
 'PASTEL_education': 10,
 'PASTEL_ethnic': 10,
 'PASTEL_gender': 3,
 'PASTEL_politics': 3,
 'PASTEL_tod': 5,
 'SARC': 2,
 'SarcasmGhosh': 2,
 'SentiTreeBank': 1,
 'ShortHumor': 2,
 'ShortJokeKaggle': 2,
 'ShortRomance': 2,
 'StanfordPoliteness': 1,
 'TroFi': 2,
 'VUA': 2}

In [None]:
class MyDataset(Dataset):
    """Map-style dataset over a tab-separated file with `text` and `label` columns.

    The whole file is read and tokenized eagerly in `__init__`; `__getitem__`
    only converts the pre-computed encodings of one row into tensors.
    (An iterable-style dataset might be preferable for very large files.)

    Args:
        tsv_file: Path to a tab-separated file containing at least the
            columns `text` and `label`.
        tokenizer_name: Checkpoint name passed to `AutoTokenizer.from_pretrained`.
            Defaults to "bert-base-uncased".
        max_length: Maximum sequence length passed to the tokenizer; longer
            texts are truncated. Defaults to 128.
    """

    def __init__(self, tsv_file, tokenizer_name="bert-base-uncased", max_length=128):
        self.tokenizer = AutoTokenizer.from_pretrained(tokenizer_name)

        # Drop rows with a missing value in any column and renumber the rest
        # so that positional indices 0..len-1 line up with the encodings.
        frame = pd.read_csv(tsv_file, sep='\t').dropna().reset_index(drop=True)

        # Labels read as float64 are stored as float32.
        if frame['label'].dtype == 'float64':
            frame['label'] = frame['label'].astype('float32')
        self.df = frame

        # padding=True pads every row to the longest sequence in the file
        # (after truncation to max_length), so all rows share one length.
        self.encodings = self.tokenizer(
            frame['text'].tolist(),
            truncation=True,
            padding=True,
            max_length=max_length,
        )
        self.labels = frame['label'].tolist()

    def __len__(self):
        """Return the number of rows kept after dropping incomplete ones."""
        return len(self.df)

    def __getitem__(self, idx):
        """Return the tensors for row `idx`.

        Args:
            idx: Integer position, or a tensor holding one.

        Returns:
            dict with one tensor per tokenizer output field plus `labels`,
            a tensor of shape (1,) holding the row's label.
        """
        if torch.is_tensor(idx):
            idx = idx.tolist()
        item = {key: torch.tensor(values[idx]) for key, values in self.encodings.items()}
        # Wrapped in a list so each sample's label has shape (1,).
        item["labels"] = torch.tensor([self.labels[idx]])
        return item


In [None]:
# Pearson and Spearman correlation metrics loaded through `datasets.load_metric`.
# NOTE(review): neither object is referenced in the visible part of this notebook;
# `load_metric` is also reported as deprecated in newer `datasets` releases — confirm
# before upgrading the library.
pearsonr = load_metric("pearsonr")
spearmanr = load_metric("spearmanr")

In [None]:
# Batch size used for both training and evaluation in train_baseline.
# Observed GPU memory usage while choosing it:
#   bs 32 -> 6617 - 6680 MB
#   bs 48 -> 7894 MB
#   bs 64 -> out of memory
batch_size = 32

In [None]:
def _build_compute_metrics(num_labels):
    """Return the `compute_metrics` callback matching the task type.

    Args:
        num_labels: Number of labels of the task. 1 selects the regression
            metric (RMSE); 2 selects binary-averaged classification metrics;
            anything else selects macro-averaged classification metrics.

    Returns:
        A callable taking the Trainer's evaluation prediction object and
        returning a dict of metric name -> value.
    """
    if num_labels == 1:
        def compute_metrics(pred):
            predictions, labels = pred
            # Root of the MSE computed explicitly: the `squared=False` keyword
            # is deprecated/removed in newer scikit-learn releases.
            rmse = np.sqrt(mean_squared_error(labels, predictions))
            return {"rmse": rmse}
        return compute_metrics

    average = 'binary' if num_labels == 2 else 'macro'

    def compute_metrics(pred):
        labels = pred.label_ids
        preds = pred.predictions.argmax(-1)
        precision, recall, f1, _ = precision_recall_fscore_support(labels, preds, average=average)
        acc = accuracy_score(labels, preds)
        return {
            'accuracy': acc,
            'f1': f1,
            'precision': precision,
            'recall': recall
        }
    return compute_metrics


def train_baseline(task, freeze_bert=False):
    """Fine-tune a single-task `bert-base-uncased` classifier/regressor on `task`.

    Trains for 5 epochs on the task's train split, evaluates on the dev split
    after every epoch and writes checkpoints and logs under
    `../../result/baselines/<task>` (or `<task>_freezed` when `freeze_bert`
    is set). The test split is not loaded or evaluated here.

    Args:
        task: Task name; must be a key of the module-level `tasks` mapping and
            have matching `processed/{train,dev}/<task>.tsv` files.
        freeze_bert: When True, every parameter under the model's `.bert`
            sub-module gets `requires_grad = False`, so those weights are not
            updated during training.

    Returns:
        None. Results are the checkpoints/logs written by the Trainer.
    """
    # Release cached GPU memory left over from a previous run in this kernel.
    torch.cuda.empty_cache()
    num_labels = tasks[task]

    data_folder = '../../data/xslue'
    train_dataset = MyDataset(f'{data_folder}/processed/train/{task}.tsv')
    valid_dataset = MyDataset(f'{data_folder}/processed/dev/{task}.tsv')

    singletaskbert = BertForSequenceClassification.from_pretrained("bert-base-uncased", num_labels=num_labels)
    if freeze_bert:
        for param in singletaskbert.bert.parameters():
            param.requires_grad = False

    result_folder = '../../result'
    # NOTE: the "_freezed" suffix is kept as-is so existing result folders keep matching.
    run_name = task + '_freezed' if freeze_bert else task
    output_dir = f"{result_folder}/baselines/{run_name}"

    training_args = TrainingArguments(
        output_dir=output_dir,                   # output directory
        num_train_epochs=5,                      # total number of training epochs
        per_device_train_batch_size=batch_size,  # batch size per device during training
        per_device_eval_batch_size=batch_size,   # batch size for evaluation
        warmup_steps=500,                        # number of warmup steps for learning rate scheduler
        weight_decay=0.01,                       # strength of weight decay
        logging_dir=f"{output_dir}/logs",        # directory for storing logs
        evaluation_strategy="epoch",             # evaluate at the end of every epoch
        save_total_limit=1,                      # older checkpoints are deleted
        save_strategy='epoch',                   # save at the end of every epoch
        load_best_model_at_end=True,             # best checkpoint is decided on loss
    )

    trainer = Trainer(
        model=singletaskbert,                # the instantiated Transformers model to be trained
        args=training_args,                  # training arguments, defined above
        train_dataset=train_dataset,         # training dataset
        eval_dataset=valid_dataset,          # evaluation dataset
        compute_metrics=_build_compute_metrics(num_labels),  # metrics reported at each evaluation
    )
    trainer.train()

# experiments

## 17

In [None]:
# Task at position 17 of the task registry ('ShortJokeKaggle' in the listing printed earlier): full fine-tuning.
task = list(tasks)[17]
train_baseline(task)

Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.decoder.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.0967,0.089392,0.969527,0.969484,0.969312,0.969657
2,0.0555,0.087918,0.976235,0.976109,0.97974,0.972504
3,0.0287,0.103096,0.979789,0.979639,0.985327,0.974017
4,0.011,0.09244,0.982187,0.98204,0.988637,0.975529
5,0.0037,0.113888,0.982054,0.981869,0.990493,0.973394


***** Running Evaluation *****
  Num examples = 22512
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortJokeKaggle/checkpoint-12709
Configuration saved in ../../result/baselines/ShortJokeKaggle/checkpoint-12709/config.json
Model weights saved in ../../result/baselines/ShortJokeKaggle/checkpoint-12709/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 22512
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortJokeKaggle/checkpoint-25418
Configuration saved in ../../result/baselines/ShortJokeKaggle/checkpoint-25418/config.json
Model weights saved in ../../result/baselines/ShortJokeKaggle/checkpoint-25418/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/ShortJokeKaggle/checkpoint-12709] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 22512
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortJokeKaggle/checkpoint-38127
Configuration saved in ../../result/baselines/

In [None]:
# Task at position 17 of the task registry ('ShortJokeKaggle' in the listing printed earlier): BERT encoder parameters frozen.
task = list(tasks)[17]
train_baseline(task, freeze_bert=True)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,0.4606,0.426597,0.827958,0.840637,0.78186,0.90897
2,0.4333,0.395988,0.838086,0.849536,0.792331,0.915643
3,0.4239,0.384267,0.841507,0.852586,0.795774,0.918135
4,0.4161,0.375889,0.846926,0.856081,0.806627,0.911995
5,0.4173,0.374724,0.847237,0.856559,0.806155,0.913686


***** Running Evaluation *****
  Num examples = 22512
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortJokeKaggle_freezed/checkpoint-12709
Configuration saved in ../../result/baselines/ShortJokeKaggle_freezed/checkpoint-12709/config.json
Model weights saved in ../../result/baselines/ShortJokeKaggle_freezed/checkpoint-12709/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 22512
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortJokeKaggle_freezed/checkpoint-25418
Configuration saved in ../../result/baselines/ShortJokeKaggle_freezed/checkpoint-25418/config.json
Model weights saved in ../../result/baselines/ShortJokeKaggle_freezed/checkpoint-25418/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/ShortJokeKaggle_freezed/checkpoint-12709] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 22512
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortJokeKaggle_freezed

## 18

In [None]:
# Task at position 18 of the task registry ('ShortRomance' in the listing printed earlier): full fine-tuning.
task = list(tasks)[18]
train_baseline(task)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.420221,0.943396,0.94,1.0,0.886792
2,No log,0.037682,0.990566,0.990476,1.0,0.981132
3,No log,0.004325,1.0,1.0,1.0,1.0
4,No log,0.001907,1.0,1.0,1.0,1.0
5,No log,0.090246,0.981132,0.980769,1.0,0.962264


***** Running Evaluation *****
  Num examples = 106
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortRomance/checkpoint-60
Configuration saved in ../../result/baselines/ShortRomance/checkpoint-60/config.json
Model weights saved in ../../result/baselines/ShortRomance/checkpoint-60/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 106
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortRomance/checkpoint-120
Configuration saved in ../../result/baselines/ShortRomance/checkpoint-120/config.json
Model weights saved in ../../result/baselines/ShortRomance/checkpoint-120/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/ShortRomance/checkpoint-60] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 106
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortRomance/checkpoint-180
Configuration saved in ../../result/baselines/ShortRomance/checkpoint-180/config.json
Model weig

In [None]:
# Task at position 18 of the task registry ('ShortRomance' in the listing printed earlier): BERT encoder parameters frozen.
task = list(tasks)[18]
train_baseline(task, freeze_bert=True)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.688077,0.566038,0.557692,0.568627,0.54717
2,No log,0.679605,0.613208,0.713287,0.566667,0.962264
3,No log,0.668829,0.584906,0.706667,0.546392,1.0
4,No log,0.653131,0.632075,0.731034,0.576087,1.0
5,No log,0.635425,0.613208,0.717241,0.565217,0.981132


***** Running Evaluation *****
  Num examples = 106
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortRomance_freezed/checkpoint-60
Configuration saved in ../../result/baselines/ShortRomance_freezed/checkpoint-60/config.json
Model weights saved in ../../result/baselines/ShortRomance_freezed/checkpoint-60/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 106
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortRomance_freezed/checkpoint-120
Configuration saved in ../../result/baselines/ShortRomance_freezed/checkpoint-120/config.json
Model weights saved in ../../result/baselines/ShortRomance_freezed/checkpoint-120/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/ShortRomance_freezed/checkpoint-60] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 106
  Batch size = 32
Saving model checkpoint to ../../result/baselines/ShortRomance_freezed/checkpoint-180
Configuration saved in ../../res

## 19

In [None]:
# Task at position 19 of the task registry ('StanfordPoliteness' in the listing printed earlier): full fine-tuning.
task = list(tasks)[19]
train_baseline(task)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file

Epoch,Training Loss,Validation Loss,Rmse
1,No log,0.008661,0.093067
2,0.046300,0.007674,0.087601
3,0.046300,0.008196,0.090534
4,0.008000,0.009194,0.095887
5,0.004600,0.008774,0.093668


***** Running Evaluation *****
  Num examples = 530
  Batch size = 32
Saving model checkpoint to ../../result/baselines/StanfordPoliteness/checkpoint-309
Configuration saved in ../../result/baselines/StanfordPoliteness/checkpoint-309/config.json
Model weights saved in ../../result/baselines/StanfordPoliteness/checkpoint-309/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 530
  Batch size = 32
Saving model checkpoint to ../../result/baselines/StanfordPoliteness/checkpoint-618
Configuration saved in ../../result/baselines/StanfordPoliteness/checkpoint-618/config.json
Model weights saved in ../../result/baselines/StanfordPoliteness/checkpoint-618/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/StanfordPoliteness/checkpoint-309] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 530
  Batch size = 32
Saving model checkpoint to ../../result/baselines/StanfordPoliteness/checkpoint-927
Configuration saved in ../../result/baseline

In [None]:
# Task at position 19 of the task registry ('StanfordPoliteness' in the listing printed earlier): BERT encoder parameters frozen.
task = list(tasks)[19]
train_baseline(task, freeze_bert=True)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file

Epoch,Training Loss,Validation Loss,Rmse
1,No log,0.01628,0.127593
2,0.176900,0.013194,0.114866
3,0.176900,0.012059,0.109815
4,0.024000,0.01208,0.109911
5,0.022300,0.011856,0.108884


***** Running Evaluation *****
  Num examples = 530
  Batch size = 32
Saving model checkpoint to ../../result/baselines/StanfordPoliteness_freezed/checkpoint-309
Configuration saved in ../../result/baselines/StanfordPoliteness_freezed/checkpoint-309/config.json
Model weights saved in ../../result/baselines/StanfordPoliteness_freezed/checkpoint-309/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 530
  Batch size = 32
Saving model checkpoint to ../../result/baselines/StanfordPoliteness_freezed/checkpoint-618
Configuration saved in ../../result/baselines/StanfordPoliteness_freezed/checkpoint-618/config.json
Model weights saved in ../../result/baselines/StanfordPoliteness_freezed/checkpoint-618/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/StanfordPoliteness_freezed/checkpoint-309] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 530
  Batch size = 32
Saving model checkpoint to ../../result/baselines/StanfordPoliteness_fre

## 20

In [None]:
# Task at position 20 of the task registry ('TroFi' in the listing printed earlier): full fine-tuning.
task = list(tasks)[20]
train_baseline(task)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.653478,0.588571,0.217391,0.909091,0.123457
2,No log,0.627876,0.668571,0.608108,0.671642,0.555556
3,No log,0.598571,0.651429,0.596026,0.642857,0.555556
4,No log,0.701564,0.674286,0.662722,0.636364,0.691358
5,0.496500,0.839991,0.714286,0.675325,0.712329,0.641975


***** Running Evaluation *****
  Num examples = 175
  Batch size = 32
Saving model checkpoint to ../../result/baselines/TroFi/checkpoint-105
Configuration saved in ../../result/baselines/TroFi/checkpoint-105/config.json
Model weights saved in ../../result/baselines/TroFi/checkpoint-105/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 175
  Batch size = 32
Saving model checkpoint to ../../result/baselines/TroFi/checkpoint-210
Configuration saved in ../../result/baselines/TroFi/checkpoint-210/config.json
Model weights saved in ../../result/baselines/TroFi/checkpoint-210/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/TroFi/checkpoint-105] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 175
  Batch size = 32
Saving model checkpoint to ../../result/baselines/TroFi/checkpoint-315
Configuration saved in ../../result/baselines/TroFi/checkpoint-315/config.json
Model weights saved in ../../result/baselines/TroFi/checkpoint-315/py

In [None]:
# Task at position 20 of the task registry ('TroFi' in the listing printed earlier): BERT encoder parameters frozen.
task = list(tasks)[20]
train_baseline(task, freeze_bert=True)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.687581,0.531429,0.068182,0.428571,0.037037
2,No log,0.687925,0.531429,0.0,0.0,0.0
3,No log,0.689353,0.537143,0.0,0.0,0.0
4,No log,0.689072,0.537143,0.0,0.0,0.0
5,0.687700,0.685814,0.548571,0.048193,1.0,0.024691


***** Running Evaluation *****
  Num examples = 175
  Batch size = 32
Saving model checkpoint to ../../result/baselines/TroFi_freezed/checkpoint-105
Configuration saved in ../../result/baselines/TroFi_freezed/checkpoint-105/config.json
Model weights saved in ../../result/baselines/TroFi_freezed/checkpoint-105/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 175
  Batch size = 32
Saving model checkpoint to ../../result/baselines/TroFi_freezed/checkpoint-210
Configuration saved in ../../result/baselines/TroFi_freezed/checkpoint-210/config.json
Model weights saved in ../../result/baselines/TroFi_freezed/checkpoint-210/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 175
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ../../result/baselines/TroFi_freezed/checkpoint-315
Configuration saved in ../../result/baselines/TroFi_freezed/checkpoint-315/config.json
Model weights saved in ../../result/baselines/TroFi

## 21

In [None]:
# Select the task name stored at position 21 of the `tasks` mapping (loaded
# from tasks.json) and run the baseline training routine on it.
# NOTE(review): the checkpoint paths logged by this cell point at
# ../../result/baselines/VUA, so index 21 appears to be the VUA task — confirm
# against tasks.json, since the lookup depends on the file's key order.
task = list(tasks)[21]
train_baseline(task)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.400075,0.831502,0.638743,0.760125,0.55079
2,0.506900,0.334926,0.85409,0.712395,0.762887,0.668172
3,0.336600,0.468239,0.862027,0.728365,0.77892,0.683973
4,0.168400,0.619311,0.864469,0.729927,0.791557,0.677201
5,0.079800,0.759781,0.8663,0.740828,0.778607,0.706546


***** Running Evaluation *****
  Num examples = 1638
  Batch size = 32
Saving model checkpoint to ../../result/baselines/VUA/checkpoint-474
Configuration saved in ../../result/baselines/VUA/checkpoint-474/config.json
Model weights saved in ../../result/baselines/VUA/checkpoint-474/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 1638
  Batch size = 32
Saving model checkpoint to ../../result/baselines/VUA/checkpoint-948
Configuration saved in ../../result/baselines/VUA/checkpoint-948/config.json
Model weights saved in ../../result/baselines/VUA/checkpoint-948/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/VUA/checkpoint-474] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1638
  Batch size = 32
Saving model checkpoint to ../../result/baselines/VUA/checkpoint-1422
Configuration saved in ../../result/baselines/VUA/checkpoint-1422/config.json
Model weights saved in ../../result/baselines/VUA/checkpoint-1422/pytorch_model.bi

In [None]:
# Re-run the baseline for the task at position 21 of the `tasks` mapping, this
# time passing freeze_bert=True.
# NOTE(review): presumably this keeps the BERT encoder weights fixed and trains
# only the classification head — confirm in train_baseline. The logged
# checkpoints for this run go to ../../result/baselines/VUA_freezed.
task = list(tasks)[21]
train_baseline(task, freeze_bert=True)

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading file https://huggingface.co/bert-base-uncased/resolve/main/vocab.txt from cache at /home/j

loading configuration file https://huggingface.co/bert-base-uncased/resolve/main/config.json from cache at /home/jz17d/.cache/huggingface/transformers/3c61d016573b14f7f008c02c4e51a366c67ab274726fe2910691e2a761acf43e.37395cee442ab11005bcd270f3c34464dc1704b715b5d7d52b1a461abe3b9e4e
Model config BertConfig {
  "architectures": [
    "BertForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "transformers_version": "4.12.3",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 30522
}

loading weights file https://huggingface.co/bert-base-uncased/resolve/main/pytorch_model.bin from 

Epoch,Training Loss,Validation Loss,Accuracy,F1,Precision,Recall
1,No log,0.580977,0.729548,0.0,0.0,0.0
2,0.614200,0.573718,0.729548,0.0,0.0,0.0
3,0.589700,0.571166,0.729548,0.0,0.0,0.0
4,0.588800,0.569901,0.729548,0.0,0.0,0.0
5,0.582000,0.568249,0.729548,0.0,0.0,0.0


***** Running Evaluation *****
  Num examples = 1638
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ../../result/baselines/VUA_freezed/checkpoint-474
Configuration saved in ../../result/baselines/VUA_freezed/checkpoint-474/config.json
Model weights saved in ../../result/baselines/VUA_freezed/checkpoint-474/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 1638
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ../../result/baselines/VUA_freezed/checkpoint-948
Configuration saved in ../../result/baselines/VUA_freezed/checkpoint-948/config.json
Model weights saved in ../../result/baselines/VUA_freezed/checkpoint-948/pytorch_model.bin
Deleting older checkpoint [../../result/baselines/VUA_freezed/checkpoint-474] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 1638
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving mo