# Combining Knowledge Graphs and Deep Learning techniques for Categorizing Tweets
## BERT Models (TweetBERT, BERT, RoBERTa, CamemBERT, DistilBERT, Albert, Flaubert)


Authors:


Experiments:
* Applying RF, RNN and Bi-LSTM models to 2 datasets for classifying 4 binary categories.
* 2 datatasets: (i) textual information and (ii) textual information and embeddings obtained from knowledge graph exploitation (KGE).
 
 


In [1]:
from keras.preprocessing import sequence
from keras.models import Sequential
from keras.layers import Dense, Dropout, Embedding, LSTM, Bidirectional
from keras.datasets import imdb 
import spacy
import nltk.data
import pandas as pd
import numpy as np
from nltk.tokenize import word_tokenize
from nltk.stem import SnowballStemmer
import regex as re
import string
from collections import defaultdict
import matplotlib.pyplot as plt
import seaborn as sns
pd.set_option('display.max_colwidth', None)
import sklearn
from sklearn.model_selection import train_test_split
from sklearn.metrics import f1_score, accuracy_score
from simpletransformers.classification import ClassificationModel
import io
import os
import json
from collections import Counter
from wordcloud import WordCloud
import re, string, unicodedata
import nltk
from nltk import word_tokenize, sent_tokenize, FreqDist
from nltk.corpus import stopwords
from nltk.stem import LancasterStemmer, WordNetLemmatizer
nltk.download
from ast import literal_eval
'''
tweets = pd.read_csv('ed-dataset-falcon_spacy2-embeddings-sentence.csv', sep=';', encoding='utf8', converters=
                           {
                            'entities_instances_wikidata':literal_eval,
                            'spacy_entities_ids':literal_eval,
                            'spacy_entities_labels':literal_eval,
                            'falcon_spacy_entities':literal_eval,
                            'falcon_spacy_labels':literal_eval,
                            'falcon_spacy_embeddingsmd4_mw50_RW':literal_eval,
                            'falcon_spacy_embeddingsmd2_mw100_RW':literal_eval,
                            'sent_embedding_1':literal_eval,
                            'sent_embedding_2':literal_eval},error_bad_lines=False)

'''
tweets = pd.read_csv('ed-dataset-falcon_spacy2-embeddings-sentence-md4.csv', sep=';', encoding='utf8', converters=
                           {
                            'falcon_spacy_embeddingsmd4_mw50_RW':literal_eval,
                            'sent_embedding_1':literal_eval},error_bad_lines=False)

In [2]:
n_unique_words = 10000 # cut texts after this number of words
maxlen = 100
batch_size = 128 

In [3]:
punctuations = "¡!#$%&'()*+,-./:;<=>¿?@[\]^_`{|}~"

def read_txt(filename):
    list = []
    with open(filename, 'r', encoding='utf-8') as f:
        data = f.readlines()
        for line in data:
            list.append(str(line).replace('\n', ''))
    return list

stopwords = read_txt('english_stopwords.txt')

stemmer = SnowballStemmer('english')


def clean_accents(tweet):
    tweet = re.sub(r"[àáâãäå]", "a", tweet)
    tweet = re.sub(r"ç", "c", tweet)
    tweet = re.sub(r"[èéêë]", "e", tweet)
    tweet = re.sub(r"[ìíîï]", "i", tweet)
    tweet = re.sub(r"[òóôõö]", "o", tweet)
    tweet = re.sub(r"[ùúûü]", "u", tweet)
    tweet = re.sub(r"[ýÿ]", "y", tweet)

    return tweet

def clean_tweet(tweet, stem = False):
    tweet = tweet.lower().strip()
    tweet = re.sub(r'https?:\/\/\S+', '', tweet)
    tweet = re.sub(r'http?:\/\/\S+', '', tweet)
    tweet = re.sub(r'www?:\/\/\S+', '', tweet)
    tweet = re.sub(r'\s([@#][\w_-]+)', "", tweet)
    tweet = re.sub(r"\n", " ", tweet)
    tweet = clean_accents(tweet)
    tweet = re.sub(r"\b(a*ha+h[ha]*|o?l+o+l+[ol]*|x+d+[x*d*]*|a*ja+[j+a+]+)\b", "<risas>", tweet)
    for symbol in punctuations:
        tweet = tweet.replace(symbol, "")
    tokens = []
    for token in tweet.strip().split():
        if token not in punctuations and token not in stopwords:
            if stem:
                tokens.append(stemmer.stem(token))
            else:
                tokens.append(token)
    return " ".join(tokens)

In [4]:
tweets1 = tweets.copy()
tweets1['text_cleaned'] = tweets['text_orig'].apply(lambda s : clean_tweet(s))
print(tweets1['text_cleaned'].head(5))

0                                                                                                                                                                             this is how you make it better
1    the effects of dosagecontrolled cannabis capsules on cancerrelated cachexia and anorexia syndrome in advanced cancer patients pilot study gil barsela daniela zalman valerya semenysty eyal ballan 2019
2                                                                                                                                                                         kaydoloo you are the best anorexic
3                                                                                                                                                                                  maxy is the best anorexic
4                                                                                                                                                                                   

In [5]:
# This will hold all of the dataset samples, as strings.
sen_w_feats = []

# The labels for the samples.
labels = []

# First, reload the dataset to undo the transformations we applied for XGBoost.
data_df = tweets.copy()

# Some of the reviews are missing either a "Title" or "Review Text", so we'll 
# replace the NaN values with empty string.
data_df = data_df.fillna("")

# Combining features following https://mccormickml.com/2021/06/29/combining-categorical-numerical-features-with-bert/
print('Combining features ...')

# For each of the samples...
for index, row in data_df.iterrows():

    # Piece it together...    
    combined = row["text_orig"]
    combined += " {:} ".format(row["sent_embedding_1"])
    
    # Add the combined text to the list.
    sen_w_feats.append(combined)

    # Also record the sample's label.
    labels.append(row["ProED"])

print('  DONE.')

print('Dataset contains {:,} samples.'.format(len(sen_w_feats)))



Combining features into strings...
  DONE.
Dataset contains 1,968 samples.


In [9]:
X = sen_w_feats
X2 = tweets1['text_cleaned']

df = tweets1.copy()
Y1 = df['ED_Patient']
Y2 = df['ProED']
Y3 = df['informative']
Y4 = df['scientific']

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y1, test_size=0.3, random_state=42)
X2_train, X2_test, y2_train, y2_test = train_test_split(X, Y2, test_size=0.3, random_state=42)
X3_train, X3_test, y3_train, y3_test = train_test_split(X, Y3, test_size=0.3, random_state=42)
X4_train, X4_test, y4_train, y4_test = train_test_split(X, Y4, test_size=0.3, random_state=42)

In [10]:
y1_test.value_counts(normalize=True)

1    0.500846
0    0.499154
Name: ED_Patient, dtype: float64

In [11]:
train_args ={"reprocess_input_data": True,
           "fp16":False,
             "evaluate_during_training": False,
             "evaluate_during_training_verbose":False,
             "learning_rate":2e-5,
             "train_batch_size":32,
             "eval_batch_size":32,
           "num_train_epochs": 15, 'overwrite_output_dir': True, "evaluation_strategy":'epochs'
            }
#optimizer = torch.optim.SGD(model.parameters(), lr=0.01, momentum=0.9)


def f1_multiclass(labels, preds):
    return f1_score(labels, preds, average='micro')

def calcule_f1(df):
    return(df['tp'] / (df['tp'] + 0.5 * (df['fp'] + df['fn'])))

import torch
import gc
from tqdm import tqdm


dfEval1 = pd.DataFrame()

In [12]:
N_ITER = 5

In [13]:
gc.collect()
torch.cuda.empty_cache()

In [14]:
import torch
print(torch.cuda.is_available())


True


## 1. BERT Models applied to Category I - Tweets written by people suffering Eating Disorders

In [15]:
#gc.collect()
#torch.cuda.empty_cache()
limitsave=0

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y1, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1 = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1b = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1 = dfResultsModels1.append(dfResultsModels1b)

    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)
    if(idx == 0):
        dfResultsModelsTotal = dfResultsModels1Trans.copy()
    else:
        dfResultsModelsTotal = dfResultsModelsTotal.append(dfResultsModels1Trans)
    dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-1.csv')

X1_train, X1_test, y1_train, y1_test = train_test_split(X2, Y1, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })
for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1w = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1bw = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1w = dfResultsModels1.append(dfResultsModels1bw)

    dfResultsModels1Transw = pd.DataFrame(dfResultsModels1w.mean(axis=0)).T
    dfResultsModels1Transw['f1'] = calcule_f1(dfResultsModels1Transw)

    if(idx == 0):
        dfResultsModelsTotalw = dfResultsModels1Transw.copy()
    else:
        dfResultsModelsTotalw = dfResultsModelsTotalw.append(dfResultsModels1Transw)
    dfResultsModelsTotalw.to_csv('dfResultsModelsTotalEMB-1.csv')

Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7878352324236629, 'tp': 257, 'tn': 271, 'fp': 24, 'fn': 39, 'auroc': 0.9658497480531378, 'auprc': 0.9642829285393035, 'f1': 0.8934010152284264, 'acc': 0.8934010152284264, 'eval_loss': 0.48037906461640406}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7916769683926131, 'tp': 256, 'tn': 273, 'fp': 22, 'fn': 40, 'auroc': 0.9601465872652314, 'auprc': 0.9595259045634104, 'f1': 0.8950930626057529, 'acc': 0.8950930626057529, 'eval_loss': 0.5045918649748752}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8073403136253784, 'tp': 264, 'tn': 270, 'fp': 25, 'fn': 32, 'auroc': 0.9692624828218048, 'auprc': 0.9666957074325273, 'f1': 0.9035532994923858, 'acc': 0.9035532994923858, 'eval_loss': 0.4722842895670941}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8088002809903417, 'tp': 258, 'tn': 276, 'fp': 19, 'fn': 38, 'auroc': 0.950641319285387, 'auprc': 0.9493225656643759, 'f1': 0.9035532994923858, 'acc': 0.9035532994923858, 'eval_loss': 0.48424247956197514}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7878352324236629, 'tp': 257, 'tn': 271, 'fp': 24, 'fn': 39, 'auroc': 0.9662734768666972, 'auprc': 0.9640961414002673, 'f1': 0.8934010152284264, 'acc': 0.8934010152284264, 'eval_loss': 0.5099467039108276}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7395372858036005, 'tp': 255, 'tn': 259, 'fp': 36, 'fn': 41, 'auroc': 0.9413421896472745, 'auprc': 0.9457690003959699, 'f1': 0.8697123519458545, 'acc': 0.8697123519458545, 'eval_loss': 0.8390981892221853}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7608619501614943, 'tp': 244, 'tn': 275, 'fp': 20, 'fn': 52, 'auroc': 0.9339899221255153, 'auprc': 0.9433627623988977, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.5833751167121687}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7497222407318532, 'tp': 262, 'tn': 255, 'fp': 40, 'fn': 34, 'auroc': 0.9475034356390288, 'auprc': 0.9425227480550807, 'f1': 0.8747884940778342, 'acc': 0.8747884940778342, 'eval_loss': 0.7791959611993087}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7537083776243768, 'tp': 253, 'tn': 265, 'fp': 30, 'fn': 43, 'auroc': 0.9501603298213468, 'auprc': 0.9534147234758288, 'f1': 0.8764805414551607, 'acc': 0.8764805414551607, 'eval_loss': 0.7848740572992124}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7410106621075094, 'tp': 240, 'tn': 273, 'fp': 22, 'fn': 56, 'auroc': 0.949702244617499, 'auprc': 0.9448591149002741, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.8962025375742662}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8210141452282957, 'tp': 274, 'tn': 264, 'fp': 31, 'fn': 22, 'auroc': 0.9680943655519927, 'auprc': 0.9683908475497751, 'f1': 0.910321489001692, 'acc': 0.9103214890016921, 'eval_loss': 0.6178806973131079}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8309718924549424, 'tp': 268, 'tn': 273, 'fp': 22, 'fn': 28, 'auroc': 0.9655978011910215, 'auprc': 0.9634542499008403, 'f1': 0.9153976311336718, 'acc': 0.9153976311336718, 'eval_loss': 0.5106814408576802}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8141101508182359, 'tp': 265, 'tn': 271, 'fp': 24, 'fn': 31, 'auroc': 0.958451672010994, 'auprc': 0.9618272677774247, 'f1': 0.9069373942470389, 'acc': 0.9069373942470389, 'eval_loss': 0.6590833836480191}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8046410963546419, 'tp': 260, 'tn': 273, 'fp': 22, 'fn': 36, 'auroc': 0.9631584974805314, 'auprc': 0.9649757399487017, 'f1': 0.9018612521150592, 'acc': 0.9018612521150592, 'eval_loss': 0.6477999114676526}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8341827094306696, 'tp': 272, 'tn': 270, 'fp': 25, 'fn': 24, 'auroc': 0.9692395785616124, 'auprc': 0.968148517427925, 'f1': 0.9170896785109983, 'acc': 0.9170896785109983, 'eval_loss': 0.5597335570736935}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7428221312949637, 'tp': 259, 'tn': 256, 'fp': 39, 'fn': 37, 'auroc': 0.9486486486486486, 'auprc': 0.949543770350779, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.7104229903534839}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.766864553563473, 'tp': 257, 'tn': 265, 'fp': 30, 'fn': 39, 'auroc': 0.9546381126889603, 'auprc': 0.9561556830761455, 'f1': 0.8832487309644669, 'acc': 0.883248730964467, 'eval_loss': 0.6598751137131139}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7565088021857471, 'tp': 257, 'tn': 262, 'fp': 33, 'fn': 39, 'auroc': 0.950114521300962, 'auprc': 0.947317721416989, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.6230187776841616}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7564193617969368, 'tp': 258, 'tn': 261, 'fp': 34, 'fn': 38, 'auroc': 0.9362116353641777, 'auprc': 0.9273375857567485, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.6421784601713482}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7801511905482855, 'tp': 261, 'tn': 265, 'fp': 30, 'fn': 35, 'auroc': 0.945018323408154, 'auprc': 0.94714436518865, 'f1': 0.8900169204737732, 'acc': 0.8900169204737732, 'eval_loss': 0.6085808246739601}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7520388066819702, 'tp': 235, 'tn': 280, 'fp': 15, 'fn': 61, 'auroc': 0.9532180485570316, 'auprc': 0.9566030465623196, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.5133460971869921}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7369203239192879, 'tp': 226, 'tn': 283, 'fp': 12, 'fn': 70, 'auroc': 0.9538135593220339, 'auprc': 0.9516793596557581, 'f1': 0.8612521150592216, 'acc': 0.8612521150592216, 'eval_loss': 0.5663052781632072}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.760608966777908, 'tp': 234, 'tn': 283, 'fp': 12, 'fn': 62, 'auroc': 0.9441937700412277, 'auprc': 0.9372272776485002, 'f1': 0.8747884940778342, 'acc': 0.8747884940778342, 'eval_loss': 0.5009492729839525}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7665869048047708, 'tp': 236, 'tn': 283, 'fp': 12, 'fn': 60, 'auroc': 0.9470682546953735, 'auprc': 0.9492107707122541, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.5623332356151781}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7516849125368269, 'tp': 231, 'tn': 283, 'fp': 12, 'fn': 65, 'auroc': 0.9554512139257902, 'auprc': 0.9565363599589081, 'f1': 0.8697123519458545, 'acc': 0.8697123519458545, 'eval_loss': 0.5398756673461512}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7868456318992997, 'tp': 263, 'tn': 265, 'fp': 30, 'fn': 33, 'auroc': 0.9449954191479615, 'auprc': 0.9550903354050484, 'f1': 0.8934010152284264, 'acc': 0.8934010152284264, 'eval_loss': 0.47945916652679443}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7908522215708697, 'tp': 259, 'tn': 270, 'fp': 25, 'fn': 37, 'auroc': 0.9348373797526339, 'auprc': 0.9428914423861712, 'f1': 0.8950930626057529, 'acc': 0.8950930626057529, 'eval_loss': 0.5003169629918901}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7577764721950684, 'tp': 251, 'tn': 268, 'fp': 27, 'fn': 45, 'auroc': 0.9356962895098487, 'auprc': 0.935501681211346, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.5741129580296969}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7548983019899856, 'tp': 249, 'tn': 269, 'fp': 26, 'fn': 47, 'auroc': 0.9452473660100779, 'auprc': 0.9492152658128057, 'f1': 0.8764805414551607, 'acc': 0.8764805414551607, 'eval_loss': 0.5643688644233503}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7810588702347502, 'tp': 256, 'tn': 270, 'fp': 25, 'fn': 40, 'auroc': 0.9433921209344938, 'auprc': 0.9476600155461502, 'f1': 0.8900169204737732, 'acc': 0.8900169204737732, 'eval_loss': 0.5068766615892711}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7748927698487468, 'tp': 253, 'tn': 271, 'fp': 24, 'fn': 43, 'auroc': 0.9510192395785616, 'auprc': 0.9478183699877203, 'f1': 0.8866328257191202, 'acc': 0.8866328257191202, 'eval_loss': 0.8124390934642992}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7878352324236629, 'tp': 257, 'tn': 271, 'fp': 24, 'fn': 39, 'auroc': 0.957123224919835, 'auprc': 0.9569089719380844, 'f1': 0.8934010152284264, 'acc': 0.8934010152284264, 'eval_loss': 0.6427500295011621}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7569855696653277, 'tp': 254, 'tn': 265, 'fp': 30, 'fn': 42, 'auroc': 0.9568483737975264, 'auprc': 0.9585148872767892, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.8251689452874033}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7684673920453722, 'tp': 251, 'tn': 271, 'fp': 24, 'fn': 45, 'auroc': 0.9580279431974348, 'auprc': 0.9604163248930649, 'f1': 0.8832487309644669, 'acc': 0.883248730964467, 'eval_loss': 0.6293383225014335}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7634033293795114, 'tp': 257, 'tn': 264, 'fp': 31, 'fn': 39, 'auroc': 0.9592533211177279, 'auprc': 0.9571289345302277, 'f1': 0.8815566835871405, 'acc': 0.8815566835871405, 'eval_loss': 0.5505173943544689}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7668405487976794, 'tp': 266, 'tn': 256, 'fp': 39, 'fn': 30, 'auroc': 0.9285902427851581, 'auprc': 0.9124246832517419, 'f1': 0.8832487309644669, 'acc': 0.883248730964467, 'eval_loss': 0.5968428486958146}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7959577718114123, 'tp': 277, 'tn': 253, 'fp': 42, 'fn': 19, 'auroc': 0.9502004122766835, 'auprc': 0.93392669270498, 'f1': 0.8967851099830795, 'acc': 0.8967851099830795, 'eval_loss': 0.501896617443938}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7665998624114295, 'tp': 264, 'tn': 258, 'fp': 37, 'fn': 32, 'auroc': 0.9520327530920751, 'auprc': 0.9394139528885319, 'f1': 0.8832487309644669, 'acc': 0.883248730964467, 'eval_loss': 0.5313893209554648}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7767253837886694, 'tp': 261, 'tn': 264, 'fp': 31, 'fn': 35, 'auroc': 0.9354844251030693, 'auprc': 0.9186606218014274, 'f1': 0.8883248730964467, 'acc': 0.8883248730964467, 'eval_loss': 0.5540152729341858}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7368883625617437, 'tp': 250, 'tn': 263, 'fp': 32, 'fn': 46, 'auroc': 0.9402370590929913, 'auprc': 0.9165378735636632, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.6019582364119982}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7023538274445142, 'tp': 249, 'tn': 254, 'fp': 41, 'fn': 47, 'auroc': 0.9243415025194686, 'auprc': 0.9040323280673532, 'f1': 0.8510998307952623, 'acc': 0.8510998307952623, 'eval_loss': 0.9617483035514229}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7132952483456225, 'tp': 246, 'tn': 260, 'fp': 35, 'fn': 50, 'auroc': 0.9284757214841961, 'auprc': 0.9137909148746434, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 0.9966900442775927}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7195002992131657, 'tp': 239, 'tn': 268, 'fp': 27, 'fn': 57, 'auroc': 0.9363662391204765, 'auprc': 0.9230202891768494, 'f1': 0.8578680203045685, 'acc': 0.8578680203045685, 'eval_loss': 0.9154293058734191}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7338970206438514, 'tp': 248, 'tn': 264, 'fp': 31, 'fn': 48, 'auroc': 0.9306516262024738, 'auprc': 0.9247296839677052, 'f1': 0.8663282571912013, 'acc': 0.8663282571912013, 'eval_loss': 0.8705960904297075}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7345446669069058, 'tp': 246, 'tn': 266, 'fp': 29, 'fn': 50, 'auroc': 0.9352324782409529, 'auprc': 0.916106146119581, 'f1': 0.8663282571912013, 'acc': 0.8663282571912013, 'eval_loss': 0.9070679290514243}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8139130055637149, 'tp': 270, 'tn': 266, 'fp': 29, 'fn': 26, 'auroc': 0.9411875858909756, 'auprc': 0.9159891093878024, 'f1': 0.9069373942470389, 'acc': 0.9069373942470389, 'eval_loss': 0.7288585681664316}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7707647294581929, 'tp': 255, 'tn': 268, 'fp': 27, 'fn': 41, 'auroc': 0.9400652771415483, 'auprc': 0.9189841731070392, 'f1': 0.8849407783417935, 'acc': 0.8849407783417935, 'eval_loss': 0.840343880025964}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7666132223000571, 'tp': 259, 'tn': 263, 'fp': 32, 'fn': 37, 'auroc': 0.9315448923499771, 'auprc': 0.9180375907775447, 'f1': 0.8832487309644669, 'acc': 0.883248730964467, 'eval_loss': 0.7704787277861646}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7767253837886694, 'tp': 261, 'tn': 264, 'fp': 31, 'fn': 35, 'auroc': 0.9377290426019239, 'auprc': 0.9136631099240102, 'f1': 0.8883248730964467, 'acc': 0.8883248730964467, 'eval_loss': 0.7868806668802312}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7428820138024484, 'tp': 256, 'tn': 259, 'fp': 36, 'fn': 40, 'auroc': 0.9296209344938159, 'auprc': 0.9052266214677623, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.8417492210865021}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7394575915940288, 'tp': 259, 'tn': 255, 'fp': 40, 'fn': 37, 'auroc': 0.9228069170865781, 'auprc': 0.908051601494452, 'f1': 0.8697123519458545, 'acc': 0.8697123519458545, 'eval_loss': 0.7241806087488505}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.739466541888858, 'tp': 256, 'tn': 258, 'fp': 37, 'fn': 40, 'auroc': 0.9194285387081997, 'auprc': 0.9088909914476812, 'f1': 0.8697123519458545, 'acc': 0.8697123519458545, 'eval_loss': 0.7208244424913764}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7292852484348374, 'tp': 257, 'tn': 254, 'fp': 41, 'fn': 39, 'auroc': 0.9272274393037104, 'auprc': 0.8993391987040569, 'f1': 0.8646362098138748, 'acc': 0.8646362098138748, 'eval_loss': 0.7323959315636832}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7428280214415366, 'tp': 257, 'tn': 258, 'fp': 37, 'fn': 39, 'auroc': 0.9283612001832341, 'auprc': 0.9220703973086276, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.7305956013212715}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.722901650484425, 'tp': 260, 'tn': 249, 'fp': 46, 'fn': 36, 'auroc': 0.9222572148419605, 'auprc': 0.9058375719864862, 'f1': 0.8612521150592216, 'acc': 0.8612521150592216, 'eval_loss': 0.7621199671810149}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7010488280714569, 'tp': 227, 'tn': 273, 'fp': 22, 'fn': 69, 'auroc': 0.9300904718277601, 'auprc': 0.9176995427841429, 'f1': 0.8460236886632826, 'acc': 0.8460236886632826, 'eval_loss': 0.5764240998970834}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6812600855484651, 'tp': 223, 'tn': 271, 'fp': 24, 'fn': 73, 'auroc': 0.926620476408612, 'auprc': 0.917012298819053, 'f1': 0.8358714043993232, 'acc': 0.8358714043993232, 'eval_loss': 0.5356771969481519}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7071355747559098, 'tp': 229, 'tn': 273, 'fp': 22, 'fn': 67, 'auroc': 0.9266433806688045, 'auprc': 0.9225233833615818, 'f1': 0.8494077834179357, 'acc': 0.8494077834179357, 'eval_loss': 0.550499196115293}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7139818490982709, 'tp': 230, 'tn': 274, 'fp': 21, 'fn': 66, 'auroc': 0.9341559780119102, 'auprc': 0.9250066983095595, 'f1': 0.8527918781725887, 'acc': 0.8527918781725888, 'eval_loss': 0.5219584828928897}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7087877459786692, 'tp': 232, 'tn': 271, 'fp': 24, 'fn': 64, 'auroc': 0.930960833715071, 'auprc': 0.921079861852072, 'f1': 0.8510998307952623, 'acc': 0.8510998307952623, 'eval_loss': 0.5239971084030051}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7100350759951508, 'tp': 245, 'tn': 260, 'fp': 35, 'fn': 51, 'auroc': 0.9135077874484654, 'auprc': 0.9063349790370805, 'f1': 0.8544839255499154, 'acc': 0.8544839255499154, 'eval_loss': 0.8743990424432253}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.694580087153054, 'tp': 238, 'tn': 262, 'fp': 33, 'fn': 58, 'auroc': 0.9229214383875399, 'auprc': 0.9118318139128394, 'f1': 0.8460236886632826, 'acc': 0.8460236886632826, 'eval_loss': 0.8604560729704405}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6977770475659215, 'tp': 239, 'tn': 262, 'fp': 33, 'fn': 57, 'auroc': 0.9120190105359596, 'auprc': 0.8863397652224736, 'f1': 0.8477157360406091, 'acc': 0.8477157360406091, 'eval_loss': 0.8427876085042953}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7124448876701965, 'tp': 256, 'tn': 250, 'fp': 45, 'fn': 40, 'auroc': 0.91111429225836, 'auprc': 0.8869883993048494, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 0.8363811734475588}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6958465548289614, 'tp': 246, 'tn': 255, 'fp': 40, 'fn': 50, 'auroc': 0.9063273018781494, 'auprc': 0.870608541455889, 'f1': 0.8477157360406091, 'acc': 0.8477157360406091, 'eval_loss': 0.9325618508614992}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6723711484192787, 'tp': 231, 'tn': 262, 'fp': 33, 'fn': 65, 'auroc': 0.9152714154832798, 'auprc': 0.9004121218523222, 'f1': 0.8341793570219965, 'acc': 0.8341793570219966, 'eval_loss': 0.8127810213910905}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6823308886697068, 'tp': 233, 'tn': 263, 'fp': 32, 'fn': 63, 'auroc': 0.9178825011452131, 'auprc': 0.9059313711520851, 'f1': 0.8392554991539763, 'acc': 0.8392554991539763, 'eval_loss': 0.8170065989619807}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6874045583281247, 'tp': 238, 'tn': 260, 'fp': 35, 'fn': 58, 'auroc': 0.9180771873568483, 'auprc': 0.910798582437977, 'f1': 0.8426395939086294, 'acc': 0.8426395939086294, 'eval_loss': 0.6773232323558707}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6977770475659215, 'tp': 239, 'tn': 262, 'fp': 33, 'fn': 57, 'auroc': 0.9221197892808062, 'auprc': 0.9173014311195256, 'f1': 0.8477157360406091, 'acc': 0.8477157360406091, 'eval_loss': 0.7743727752056561}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6913893870539581, 'tp': 237, 'tn': 262, 'fp': 33, 'fn': 59, 'auroc': 0.9206310123683006, 'auprc': 0.9072754277462405, 'f1': 0.8443316412859561, 'acc': 0.8443316412859561, 'eval_loss': 0.858452933007165}


### 1.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [16]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT
dfResultsModelsTotal

dfResultssModelsTotal1 = dfResultsModelsTotal.copy()
dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.796698,258.4,272.2,22.8,37.6,0.962435,0.960785,0.895357,0.8978,0.490289
BERT,0.764355,253.0,268.0,27.0,43.0,0.952917,0.949482,0.878472,0.881557,0.72788
RoBERTa,0.820984,267.8,270.2,24.8,28.2,0.964908,0.965359,0.909956,0.910321,0.599036
DistilBERT,0.760553,258.4,261.8,33.2,37.6,0.946926,0.9455,0.87951,0.880203,0.648815
CamemBERT,0.760062,250.6,268.8,26.2,45.3,0.952205,0.950311,0.875182,0.879019,0.664035
Albert,0.774286,255.6,268.4,26.6,40.4,0.940834,0.946072,0.884123,0.886633,0.525027
Flaubert,0.770317,254.4,268.4,26.6,41.6,0.956454,0.956157,0.881802,0.884602,0.692043


### 1.2. Results using original dataset (texts)

In [17]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotalw = dfResultsModelsTotalw.reset_index(drop=True)
dfResultsModelsTotalw.index = indexBERT
dfResultsModelsTotalw

dfResultssModelsTotal1w = dfResultsModelsTotalw.copy()
dfResultssModelsTotal1w

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.764745,253.666667,267.5,27.5,42.333333,0.953752,0.949554,0.879007,0.881839,0.677029
BERT,0.748968,250.833333,265.333333,29.666667,45.166667,0.94454,0.945986,0.870229,0.873435,0.776549
RoBERTa,0.765744,254.666667,266.833333,28.166667,41.333333,0.951982,0.947669,0.879931,0.882403,0.716994
DistilBERT,0.762414,255.333333,265.166667,29.833333,40.666667,0.950755,0.947771,0.878692,0.880711,0.703722
CamemBERT,0.753568,232.333333,282.333333,12.666667,63.666667,0.950749,0.950251,0.85915,0.871066,0.536562
Albert,0.757905,253.0,266.166667,28.833333,43.0,0.9481,0.941899,0.875685,0.878455,0.732129
Flaubert,0.757162,251.5,267.333333,27.666667,44.5,0.950484,0.94801,0.874529,0.877891,0.719778


## 2. BERT Models applied to Category II - Tweets promoting Eating Disorders

In [18]:
#gc.collect()
#torch.cuda.empty_cache()
limitsave=0

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y2, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1 = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1b = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1 = dfResultsModels1.append(dfResultsModels1b)

    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)
    
    if(idx == 0):
        dfResultsModelsTotal = dfResultsModels1Trans.copy()
    else:
        dfResultsModelsTotal = dfResultsModelsTotal.append(dfResultsModels1Trans)
    dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-2.csv')

X1_train, X1_test, y1_train, y1_test = train_test_split(X2, Y2, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })
for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1w = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1bw = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1w = dfResultsModels1.append(dfResultsModels1bw)

    dfResultsModels1Transw = pd.DataFrame(dfResultsModels1w.mean(axis=0)).T
    dfResultsModels1Transw['f1'] = calcule_f1(dfResultsModels1Transw)
    
    if(idx == 0):
        dfResultsModelsTotalw = dfResultsModels1Transw.copy()
    else:
        dfResultsModelsTotalw = dfResultsModelsTotalw.append(dfResultsModels1Transw)
    dfResultsModelsTotalw.to_csv('dfResultsModelsTotalEMB-w-2.csv')

Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8361305906503663, 'tp': 118, 'tn': 438, 'fp': 27, 'fn': 8, 'auroc': 0.974347158218126, 'auprc': 0.9136935564636879, 'f1': 0.9407783417935702, 'acc': 0.9407783417935702, 'eval_loss': 0.32068824312208516}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.828767598318256, 'tp': 113, 'tn': 443, 'fp': 22, 'fn': 13, 'auroc': 0.9739716675200546, 'auprc': 0.8939677749876915, 'f1': 0.9407783417935702, 'acc': 0.9407783417935702, 'eval_loss': 0.32605101228201466}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8245293305068664, 'tp': 113, 'tn': 442, 'fp': 23, 'fn': 13, 'auroc': 0.977794845536781, 'auprc': 0.9203752502274523, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.321253454683373}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7827595341557488, 'tp': 116, 'tn': 427, 'fp': 38, 'fn': 10, 'auroc': 0.9748250554702168, 'auprc': 0.9292393348239674, 'f1': 0.9187817258883249, 'acc': 0.9187817258883249, 'eval_loss': 0.3971729855861907}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8330471712783374, 'tp': 113, 'tn': 444, 'fp': 21, 'fn': 13, 'auroc': 0.9669909540877283, 'auprc': 0.9140251018005706, 'f1': 0.9424703891708968, 'acc': 0.9424703891708968, 'eval_loss': 0.3144177652613603}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8642286294581933, 'tp': 113, 'tn': 451, 'fp': 14, 'fn': 13, 'auroc': 0.9781532684758492, 'auprc': 0.933756554468162, 'f1': 0.9543147208121827, 'acc': 0.9543147208121827, 'eval_loss': 0.2790395380778998}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8231806232868847, 'tp': 112, 'tn': 443, 'fp': 22, 'fn': 14, 'auroc': 0.9807987711213518, 'auprc': 0.9398290230988553, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.379011692450149}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.802313980275336, 'tp': 112, 'tn': 438, 'fp': 27, 'fn': 14, 'auroc': 0.9742959549411162, 'auprc': 0.9353108938053086, 'f1': 0.9306260575296108, 'acc': 0.9306260575296108, 'eval_loss': 0.4132498326040437}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.84614159148493, 'tp': 113, 'tn': 447, 'fp': 18, 'fn': 13, 'auroc': 0.9784604881379075, 'auprc': 0.9514527100175068, 'f1': 0.9475465313028765, 'acc': 0.9475465313028765, 'eval_loss': 0.31084344687405974}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8450911488194385, 'tp': 112, 'tn': 448, 'fp': 17, 'fn': 14, 'auroc': 0.9774705581157194, 'auprc': 0.9498072580950052, 'f1': 0.9475465313028765, 'acc': 0.9475465313028765, 'eval_loss': 0.32375076905009337}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.817691253362041, 'tp': 114, 'tn': 439, 'fp': 26, 'fn': 12, 'auroc': 0.9783580815838879, 'auprc': 0.9366939673444925, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.4564857599425044}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8550925279085547, 'tp': 113, 'tn': 449, 'fp': 16, 'fn': 13, 'auroc': 0.9832223928998123, 'auprc': 0.9497415782648888, 'f1': 0.9509306260575296, 'acc': 0.9509306260575296, 'eval_loss': 0.3411748973678761}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8343445627329739, 'tp': 114, 'tn': 443, 'fp': 22, 'fn': 12, 'auroc': 0.9768561187916026, 'auprc': 0.9177471938324253, 'f1': 0.9424703891708968, 'acc': 0.9424703891708968, 'eval_loss': 0.37588691275557623}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.816173700745258, 'tp': 113, 'tn': 440, 'fp': 25, 'fn': 13, 'auroc': 0.9788701143539853, 'auprc': 0.9219326601014532, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.41512601260757565}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8330471712783374, 'tp': 113, 'tn': 444, 'fp': 21, 'fn': 13, 'auroc': 0.9794504181600957, 'auprc': 0.9418427328521458, 'f1': 0.9424703891708968, 'acc': 0.9424703891708968, 'eval_loss': 0.4179723884988466}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.827476073048692, 'tp': 112, 'tn': 444, 'fp': 21, 'fn': 14, 'auroc': 0.9689025430960915, 'auprc': 0.9125587331961355, 'f1': 0.9407783417935702, 'acc': 0.9407783417935702, 'eval_loss': 0.3467848701249367}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8218946963432212, 'tp': 111, 'tn': 444, 'fp': 21, 'fn': 15, 'auroc': 0.9767878477555897, 'auprc': 0.9250458959433486, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.3336989239109435}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8516526921490684, 'tp': 114, 'tn': 447, 'fp': 18, 'fn': 12, 'auroc': 0.9782898105478751, 'auprc': 0.9421171526359663, 'f1': 0.949238578680203, 'acc': 0.949238578680203, 'eval_loss': 0.2675115587986319}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8189268884834843, 'tp': 112, 'tn': 442, 'fp': 23, 'fn': 14, 'auroc': 0.981088923024407, 'auprc': 0.9364586681693134, 'f1': 0.937394247038917, 'acc': 0.937394247038917, 'eval_loss': 0.3556581670816645}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8034475273039794, 'tp': 110, 'tn': 441, 'fp': 24, 'fn': 16, 'auroc': 0.9787506400409626, 'auprc': 0.9422467788701927, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.345991648188302}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8119753644079388, 'tp': 110, 'tn': 443, 'fp': 22, 'fn': 16, 'auroc': 0.9791773340160437, 'auprc': 0.9268563154412578, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.2831753741851763}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7845456451701095, 'tp': 111, 'tn': 435, 'fp': 30, 'fn': 15, 'auroc': 0.9746543778801844, 'auprc': 0.898212661321862, 'f1': 0.9238578680203046, 'acc': 0.9238578680203046, 'eval_loss': 0.30709086525204937}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8217957815959622, 'tp': 114, 'tn': 440, 'fp': 25, 'fn': 12, 'auroc': 0.9748933265062297, 'auprc': 0.9256374106198377, 'f1': 0.937394247038917, 'acc': 0.937394247038917, 'eval_loss': 0.25707834664928286}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8340544036645032, 'tp': 110, 'tn': 448, 'fp': 17, 'fn': 16, 'auroc': 0.9793821471240827, 'auprc': 0.9469633652413619, 'f1': 0.9441624365482234, 'acc': 0.9441624365482234, 'eval_loss': 0.22610115857892915}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.799245468813941, 'tp': 110, 'tn': 440, 'fp': 25, 'fn': 16, 'auroc': 0.9770438641406383, 'auprc': 0.9287653776987657, 'f1': 0.9306260575296108, 'acc': 0.9306260575296108, 'eval_loss': 0.28796485311498765}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8150870115520896, 'tp': 109, 'tn': 445, 'fp': 20, 'fn': 17, 'auroc': 0.9808670421573648, 'auprc': 0.936966842907295, 'f1': 0.937394247038917, 'acc': 0.937394247038917, 'eval_loss': 0.3456212923506667}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8330471712783374, 'tp': 113, 'tn': 444, 'fp': 21, 'fn': 13, 'auroc': 0.9659498207885304, 'auprc': 0.9047928510645948, 'f1': 0.9424703891708968, 'acc': 0.9424703891708968, 'eval_loss': 0.31932404346911136}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.813314075295432, 'tp': 111, 'tn': 442, 'fp': 23, 'fn': 15, 'auroc': 0.9654548557774365, 'auprc': 0.9207484619118509, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.3517631912530449}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8206734464748908, 'tp': 110, 'tn': 445, 'fp': 20, 'fn': 16, 'auroc': 0.9730670762928828, 'auprc': 0.9260758282942344, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.34185852521209437}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.813314075295432, 'tp': 111, 'tn': 442, 'fp': 23, 'fn': 15, 'auroc': 0.9679296808329068, 'auprc': 0.9030168996219133, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.3483239007059877}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7982576453378738, 'tp': 112, 'tn': 437, 'fp': 28, 'fn': 14, 'auroc': 0.9628264208909371, 'auprc': 0.8817507601184061, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.4238422152202953}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7748526070955714, 'tp': 110, 'tn': 434, 'fp': 31, 'fn': 16, 'auroc': 0.9506400409626217, 'auprc': 0.8902112299890897, 'f1': 0.9204737732656514, 'acc': 0.9204737732656514, 'eval_loss': 0.5827555650921568}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7982576453378738, 'tp': 112, 'tn': 437, 'fp': 28, 'fn': 14, 'auroc': 0.9634920634920634, 'auprc': 0.8874206359685184, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.5345668985208153}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8020560324726564, 'tp': 109, 'tn': 442, 'fp': 23, 'fn': 17, 'auroc': 0.9664618535586278, 'auprc': 0.91890445948467, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.42815165873540345}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8034475273039794, 'tp': 110, 'tn': 441, 'fp': 24, 'fn': 16, 'auroc': 0.9735449735449735, 'auprc': 0.904008767933195, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.4730458636784677}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7267869269532692, 'tp': 107, 'tn': 426, 'fp': 39, 'fn': 19, 'auroc': 0.9371394435910565, 'auprc': 0.773051030089811, 'f1': 0.9018612521150592, 'acc': 0.9018612521150592, 'eval_loss': 0.44341570299461874}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7284313854180453, 'tp': 106, 'tn': 428, 'fp': 37, 'fn': 20, 'auroc': 0.935620413039768, 'auprc': 0.7813693388924807, 'f1': 0.9035532994923858, 'acc': 0.9035532994923858, 'eval_loss': 0.44863938991176455}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7266889548473595, 'tp': 113, 'tn': 416, 'fp': 49, 'fn': 13, 'auroc': 0.9474995733060249, 'auprc': 0.758300116276904, 'f1': 0.8950930626057529, 'acc': 0.8950930626057529, 'eval_loss': 0.5400921053032538}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7113153398544007, 'tp': 105, 'tn': 425, 'fp': 40, 'fn': 21, 'auroc': 0.9371223758320533, 'auprc': 0.7411726230990556, 'f1': 0.8967851099830795, 'acc': 0.8967851099830795, 'eval_loss': 0.48349025744430135}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.755822704924114, 'tp': 106, 'tn': 435, 'fp': 30, 'fn': 20, 'auroc': 0.9331967912613073, 'auprc': 0.7685831919124412, 'f1': 0.9153976311336718, 'acc': 0.9153976311336718, 'eval_loss': 0.4112614482690237}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6443365451277309, 'tp': 82, 'tn': 442, 'fp': 23, 'fn': 44, 'auroc': 0.9383853899982932, 'auprc': 0.7950469681781188, 'f1': 0.8866328257191202, 'acc': 0.8866328257191202, 'eval_loss': 0.7202274749625327}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7111554421109056, 'tp': 90, 'tn': 446, 'fp': 19, 'fn': 36, 'auroc': 0.9355692097627581, 'auprc': 0.813567955194109, 'f1': 0.9069373942470389, 'acc': 0.9069373942470389, 'eval_loss': 0.6414738615552013}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6891351007955773, 'tp': 96, 'tn': 433, 'fp': 32, 'fn': 30, 'auroc': 0.9323434033111453, 'auprc': 0.8111095867444598, 'f1': 0.8950930626057529, 'acc': 0.8950930626057529, 'eval_loss': 0.5865886865281745}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.672919955086626, 'tp': 89, 'tn': 439, 'fp': 26, 'fn': 37, 'auroc': 0.934647550776583, 'auprc': 0.8052064273496847, 'f1': 0.8934010152284264, 'acc': 0.8934010152284264, 'eval_loss': 0.6629126094967911}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6893036567820087, 'tp': 91, 'tn': 440, 'fp': 25, 'fn': 35, 'auroc': 0.9462365591397849, 'auprc': 0.815103948043572, 'f1': 0.8984771573604061, 'acc': 0.8984771573604061, 'eval_loss': 0.6550348514390766}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7133575004897429, 'tp': 98, 'tn': 436, 'fp': 29, 'fn': 28, 'auroc': 0.9493940945553848, 'auprc': 0.8134892285273936, 'f1': 0.9035532994923858, 'acc': 0.9035532994923858, 'eval_loss': 0.6672701314354}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.715073220660927, 'tp': 99, 'tn': 435, 'fp': 30, 'fn': 27, 'auroc': 0.9458952039597202, 'auprc': 0.8025038387765643, 'f1': 0.9035532994923858, 'acc': 0.9035532994923858, 'eval_loss': 0.6213202862192319}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7047820473894525, 'tp': 100, 'tn': 431, 'fp': 34, 'fn': 26, 'auroc': 0.9432838368322239, 'auprc': 0.7737933897269041, 'f1': 0.8984771573604061, 'acc': 0.8984771573604061, 'eval_loss': 0.7030845722516748}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.708763035259694, 'tp': 100, 'tn': 432, 'fp': 33, 'fn': 26, 'auroc': 0.9522102747909199, 'auprc': 0.8391864895427257, 'f1': 0.9001692047377327, 'acc': 0.9001692047377327, 'eval_loss': 0.6709664570792627}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7227013769903973, 'tp': 101, 'tn': 434, 'fp': 31, 'fn': 25, 'auroc': 0.9475166410650281, 'auprc': 0.8279401304691213, 'f1': 0.9052453468697125, 'acc': 0.9052453468697124, 'eval_loss': 0.6761978014183114}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7015777735943846, 'tp': 96, 'tn': 436, 'fp': 29, 'fn': 30, 'auroc': 0.9453149001536099, 'auprc': 0.8330648663927729, 'f1': 0.9001692047377327, 'acc': 0.9001692047377327, 'eval_loss': 0.5476315655825218}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6810425170869976, 'tp': 96, 'tn': 431, 'fp': 34, 'fn': 30, 'auroc': 0.9398020139955625, 'auprc': 0.8085650196911948, 'f1': 0.8917089678510999, 'acc': 0.8917089678510999, 'eval_loss': 0.5958850415129411}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7067465437935766, 'tp': 101, 'tn': 430, 'fp': 35, 'fn': 25, 'auroc': 0.9403140467656597, 'auprc': 0.8171760450131085, 'f1': 0.8984771573604061, 'acc': 0.8984771573604061, 'eval_loss': 0.5386039695065272}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6790847758124445, 'tp': 97, 'tn': 429, 'fp': 36, 'fn': 29, 'auroc': 0.9365591397849462, 'auprc': 0.7875771119164526, 'f1': 0.8900169204737732, 'acc': 0.8900169204737732, 'eval_loss': 0.6036727153941205}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7067465437935766, 'tp': 101, 'tn': 430, 'fp': 35, 'fn': 25, 'auroc': 0.9299880525686979, 'auprc': 0.8232063732154483, 'f1': 0.8984771573604061, 'acc': 0.8984771573604061, 'eval_loss': 0.5506285032943675}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6520484710038007, 'tp': 87, 'tn': 437, 'fp': 28, 'fn': 39, 'auroc': 0.9372930534220857, 'auprc': 0.7737777001294018, 'f1': 0.8866328257191202, 'acc': 0.8866328257191202, 'eval_loss': 0.44572653562614795}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6287995251336668, 'tp': 86, 'tn': 433, 'fp': 32, 'fn': 40, 'auroc': 0.94026284348865, 'auprc': 0.7760131784681017, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.44819748460462216}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.671831337575351, 'tp': 91, 'tn': 436, 'fp': 29, 'fn': 35, 'auroc': 0.9438129373613244, 'auprc': 0.7739668620252318, 'f1': 0.8917089678510999, 'acc': 0.8917089678510999, 'eval_loss': 0.40940653831747015}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6555251581931926, 'tp': 89, 'tn': 435, 'fp': 30, 'fn': 37, 'auroc': 0.9366274108209591, 'auprc': 0.7669320077677714, 'f1': 0.8866328257191202, 'acc': 0.8866328257191202, 'eval_loss': 0.417594166913707}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6429509736377993, 'tp': 91, 'tn': 429, 'fp': 36, 'fn': 35, 'auroc': 0.9414234511008704, 'auprc': 0.8047034894388897, 'f1': 0.8798646362098139, 'acc': 0.8798646362098139, 'eval_loss': 0.4389545911138779}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6592023275565874, 'tp': 91, 'tn': 433, 'fp': 32, 'fn': 35, 'auroc': 0.9312510667349376, 'auprc': 0.80083816803055, 'f1': 0.8866328257191202, 'acc': 0.8866328257191202, 'eval_loss': 0.5730956540455258}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.663067124166926, 'tp': 93, 'tn': 431, 'fp': 34, 'fn': 33, 'auroc': 0.9464755077658303, 'auprc': 0.8009925468610793, 'f1': 0.8866328257191202, 'acc': 0.8866328257191202, 'eval_loss': 0.6432662593586812}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6811569507966813, 'tp': 98, 'tn': 428, 'fp': 37, 'fn': 28, 'auroc': 0.9400409626216077, 'auprc': 0.8274698719648532, 'f1': 0.8900169204737732, 'acc': 0.8900169204737732, 'eval_loss': 0.6229430961477767}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.69294338118455, 'tp': 98, 'tn': 431, 'fp': 34, 'fn': 28, 'auroc': 0.9476702508960574, 'auprc': 0.8050577262865091, 'f1': 0.8950930626057529, 'acc': 0.8950930626057529, 'eval_loss': 0.6530247107914061}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6969472241099095, 'tp': 98, 'tn': 432, 'fp': 33, 'fn': 28, 'auroc': 0.9497013142174432, 'auprc': 0.798326225272523, 'f1': 0.8967851099830795, 'acc': 0.8967851099830795, 'eval_loss': 0.591419469182208}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.5998697607967373, 'tp': 82, 'tn': 432, 'fp': 33, 'fn': 44, 'auroc': 0.9370199692780338, 'auprc': 0.7874798791606312, 'f1': 0.8697123519458545, 'acc': 0.8697123519458545, 'eval_loss': 0.5003343036300257}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6304569472351945, 'tp': 82, 'tn': 439, 'fp': 26, 'fn': 44, 'auroc': 0.8942993684929169, 'auprc': 0.7543562109460372, 'f1': 0.8815566835871405, 'acc': 0.8815566835871405, 'eval_loss': 0.7188778257634687}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6276315348822122, 'tp': 83, 'tn': 437, 'fp': 28, 'fn': 43, 'auroc': 0.9180406212664277, 'auprc': 0.7615706981254775, 'f1': 0.8798646362098139, 'acc': 0.8798646362098139, 'eval_loss': 0.6719008003680134}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6150594297697644, 'tp': 89, 'tn': 425, 'fp': 40, 'fn': 37, 'auroc': 0.9284178187403994, 'auprc': 0.7701325766512896, 'f1': 0.8697123519458545, 'acc': 0.8697123519458545, 'eval_loss': 0.650102847991021}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6143162371994761, 'tp': 85, 'tn': 431, 'fp': 34, 'fn': 41, 'auroc': 0.920378904249872, 'auprc': 0.7866057428385429, 'f1': 0.8730964467005076, 'acc': 0.8730964467005076, 'eval_loss': 0.684974961356554}


### 2.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [19]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT
dfResultsModelsTotal

dfResultssModelsTotal1 = dfResultsModelsTotal.copy()

dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.821047,114.6,438.8,26.2,11.4,0.973586,0.91426,0.85907,0.936379,0.437123
BERT,0.861122,113.6,452.0,14.2,11.4,0.981587,0.924471,0.85207,0.942117,0.335917
RoBERTa,,113.5,449.4,16.666667,13.5,0.950484,0.94801,0.862329,0.895291,0.519778
DistilBERT,0.841233,112.5,442.333333,23.666667,14.5,0.961224,0.93331,0.845113,0.941891,0.342122
CamemBERT,0.836132,110.5,448.333333,16.666667,16.5,0.961234,0.92318,0.844523,0.947192,0.330212
Albert,0.819323,113.5,444.333333,21.666667,13.5,0.911334,0.9231,0.874529,0.877891,0.419778
Flaubert,0.845622,110.5,441.333333,24.666667,16.5,0.950484,0.94801,0.841223,0.938893,0.320013


### 2.2. Results using original dataset (texts)

In [20]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotalw = dfResultsModelsTotalw.reset_index(drop=True)
dfResultsModelsTotalw.index = indexBERT
dfResultsModelsTotalw

dfResultssModelsTotal1w = dfResultsModelsTotalw.copy()
dfResultssModelsTotal1w

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.788782,109.833333,437.666667,27.333333,16.166667,0.95836,0.875147,0.834706,0.926396,0.475604
BERT,0.777696,107.333333,438.5,26.5,18.666667,0.960534,0.8829,0.826171,0.923576,0.516233
RoBERTa,0.783262,109.0,437.5,27.5,17.0,0.960747,0.885039,0.830476,0.924704,0.51976
DistilBERT,0.780603,109.0,436.833333,28.166667,17.0,0.957826,0.88425,0.828372,0.923576,0.498832
CamemBERT,0.76997,107.333333,436.666667,28.333333,18.666667,0.959731,0.881167,0.820382,0.920474,0.480219
Albert,0.77897,108.5,437.166667,27.833333,17.5,0.961111,0.880104,0.827192,0.923294,0.50563
Flaubert,0.765198,106.333333,437.0,28.0,19.666667,0.956224,0.87815,0.816901,0.919346,0.521223


## 3. BERT Models applied to Category III - Informative tweets

In [21]:
#gc.collect()
#torch.cuda.empty_cache()
limitsave=0

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y3, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1 = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1b = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1 = dfResultsModels1.append(dfResultsModels1b)

    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)
    
    if(idx == 0):
        dfResultsModelsTotal = dfResultsModels1Trans.copy()
    else:
        dfResultsModelsTotal = dfResultsModelsTotal.append(dfResultsModels1Trans)
    dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-3.csv')

X1_train, X1_test, y1_train, y1_test = train_test_split(X2, Y3, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })
for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1w = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1bw = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1w = dfResultsModels1.append(dfResultsModels1bw)

    dfResultsModels1Transw = pd.DataFrame(dfResultsModels1w.mean(axis=0)).T
    dfResultsModels1Transw['f1'] = calcule_f1(dfResultsModels1Transw)
    
    if(idx == 0):
        dfResultsModelsTotalw = dfResultsModels1Trans.copy()
    else:
        dfResultsModelsTotalw = dfResultsModelsTotalw.append(dfResultsModels1Transw)
    dfResultsModelsTotalw.to_csv('dfResultsModelsTotalEMB-w-3.csv')

Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7249079275822496, 'tp': 197, 'tn': 316, 'fp': 40, 'fn': 38, 'auroc': 0.9345864212287832, 'auprc': 0.9152233331548297, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.6695277559521952}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7441913767746011, 'tp': 203, 'tn': 315, 'fp': 41, 'fn': 32, 'auroc': 0.9375747071479799, 'auprc': 0.9182672169644023, 'f1': 0.8764805414551607, 'acc': 0.8764805414551607, 'eval_loss': 0.6338133364425678}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7141225835577715, 'tp': 201, 'tn': 308, 'fp': 48, 'fn': 34, 'auroc': 0.9330683719818312, 'auprc': 0.9067443199037865, 'f1': 0.8612521150592216, 'acc': 0.8612521150592216, 'eval_loss': 0.666266738682201}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7339350737514476, 'tp': 202, 'tn': 313, 'fp': 43, 'fn': 33, 'auroc': 0.9345983743724601, 'auprc': 0.9065358407978712, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.5981974157529246}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7071206848438116, 'tp': 200, 'tn': 307, 'fp': 49, 'fn': 35, 'auroc': 0.9330803251255081, 'auprc': 0.8928802799457785, 'f1': 0.8578680203045685, 'acc': 0.8578680203045685, 'eval_loss': 0.6718613034800479}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.716999809032934, 'tp': 205, 'tn': 304, 'fp': 52, 'fn': 30, 'auroc': 0.9250537891465457, 'auprc': 0.9085601227203082, 'f1': 0.8612521150592216, 'acc': 0.8612521150592216, 'eval_loss': 0.8439419630326723}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.746492521647894, 'tp': 201, 'tn': 318, 'fp': 38, 'fn': 34, 'auroc': 0.9205713602677504, 'auprc': 0.8949416822244027, 'f1': 0.8781725888324872, 'acc': 0.8781725888324873, 'eval_loss': 0.8102657332232124}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7201001797800046, 'tp': 205, 'tn': 305, 'fp': 51, 'fn': 30, 'auroc': 0.9049007889074827, 'auprc': 0.8500185433214525, 'f1': 0.8629441624365483, 'acc': 0.8629441624365483, 'eval_loss': 0.8247785207472349}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7287815721425686, 'tp': 204, 'tn': 309, 'fp': 47, 'fn': 31, 'auroc': 0.9193879990437486, 'auprc': 0.8917030561652671, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.9334777911242685}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.733389893128303, 'tp': 201, 'tn': 314, 'fp': 42, 'fn': 34, 'auroc': 0.9351302892660771, 'auprc': 0.9104291432628515, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.8623879244060892}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7722798990343549, 'tp': 207, 'tn': 319, 'fp': 37, 'fn': 28, 'auroc': 0.9323332536457088, 'auprc': 0.9230005638629728, 'f1': 0.8900169204737732, 'acc': 0.8900169204737732, 'eval_loss': 0.7359029701665828}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7572767041813737, 'tp': 203, 'tn': 319, 'fp': 37, 'fn': 32, 'auroc': 0.9263925412383457, 'auprc': 0.9206562897317019, 'f1': 0.8832487309644669, 'acc': 0.883248730964467, 'eval_loss': 0.8771784225184667}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7966279186373237, 'tp': 210, 'tn': 323, 'fp': 33, 'fn': 25, 'auroc': 0.9386445135070524, 'auprc': 0.9256153377626839, 'f1': 0.9018612521150592, 'acc': 0.9018612521150592, 'eval_loss': 0.7662857380744658}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7668778388716232, 'tp': 202, 'tn': 323, 'fp': 33, 'fn': 33, 'auroc': 0.9425770977767153, 'auprc': 0.9217722404562043, 'f1': 0.8883248730964467, 'acc': 0.8883248730964467, 'eval_loss': 0.8036197209975829}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7601793318832037, 'tp': 202, 'tn': 321, 'fp': 35, 'fn': 33, 'auroc': 0.9259024623475974, 'auprc': 0.9175601301560321, 'f1': 0.8849407783417935, 'acc': 0.8849407783417935, 'eval_loss': 0.811401189942109}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7042247337999805, 'tp': 195, 'tn': 312, 'fp': 44, 'fn': 40, 'auroc': 0.9180014343772412, 'auprc': 0.8991069058287623, 'f1': 0.8578680203045685, 'acc': 0.8578680203045685, 'eval_loss': 0.8078432522322002}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7117731593439036, 'tp': 197, 'tn': 312, 'fp': 44, 'fn': 38, 'auroc': 0.9135429117857997, 'auprc': 0.880795109870121, 'f1': 0.8612521150592216, 'acc': 0.8612521150592216, 'eval_loss': 0.7921034332953001}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7225839501048097, 'tp': 199, 'tn': 313, 'fp': 43, 'fn': 36, 'auroc': 0.9065264164475256, 'auprc': 0.8756492211067654, 'f1': 0.8663282571912013, 'acc': 0.8663282571912013, 'eval_loss': 0.7648236445690456}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7064756975731464, 'tp': 199, 'tn': 308, 'fp': 48, 'fn': 36, 'auroc': 0.9163399474061678, 'auprc': 0.885999476034684, 'f1': 0.8578680203045685, 'acc': 0.8578680203045685, 'eval_loss': 0.7677381148463801}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7263634458495231, 'tp': 200, 'tn': 313, 'fp': 43, 'fn': 35, 'auroc': 0.9289146545541477, 'auprc': 0.9071875934201657, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.7181951434988725}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6937437671807082, 'tp': 214, 'tn': 284, 'fp': 72, 'fn': 21, 'auroc': 0.9276476213244084, 'auprc': 0.8921807140721733, 'f1': 0.8426395939086294, 'acc': 0.8426395939086294, 'eval_loss': 0.6001221133690131}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6715182840391456, 'tp': 216, 'tn': 273, 'fp': 83, 'fn': 19, 'auroc': 0.9231412861582595, 'auprc': 0.8758586470456551, 'f1': 0.8274111675126904, 'acc': 0.8274111675126904, 'eval_loss': 0.6677321893604178}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7116741556146737, 'tp': 217, 'tn': 286, 'fp': 70, 'fn': 18, 'auroc': 0.9350466172603394, 'auprc': 0.9038518281246147, 'f1': 0.8510998307952623, 'acc': 0.8510998307952623, 'eval_loss': 0.5726866408398277}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.695024753772745, 'tp': 215, 'tn': 283, 'fp': 73, 'fn': 20, 'auroc': 0.9193640927563951, 'auprc': 0.8519062024961248, 'f1': 0.8426395939086294, 'acc': 0.8426395939086294, 'eval_loss': 0.5976948142051697}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6963371746783903, 'tp': 216, 'tn': 282, 'fp': 74, 'fn': 19, 'auroc': 0.9150848673201052, 'auprc': 0.863018630056001, 'f1': 0.8426395939086294, 'acc': 0.8426395939086294, 'eval_loss': 0.6183267518093711}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7472869314306727, 'tp': 208, 'tn': 310, 'fp': 46, 'fn': 27, 'auroc': 0.9267989481233564, 'auprc': 0.8942047827095874, 'f1': 0.8764805414551607, 'acc': 0.8764805414551607, 'eval_loss': 0.6725526054536826}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7459450740435198, 'tp': 206, 'tn': 312, 'fp': 44, 'fn': 29, 'auroc': 0.9320941907721731, 'auprc': 0.910362698222005, 'f1': 0.8764805414551607, 'acc': 0.8764805414551607, 'eval_loss': 0.6370687521994114}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7258438690432697, 'tp': 199, 'tn': 314, 'fp': 42, 'fn': 36, 'auroc': 0.9308032512550801, 'auprc': 0.8901763740479518, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.768779088792048}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7377274344939522, 'tp': 203, 'tn': 313, 'fp': 43, 'fn': 32, 'auroc': 0.9275400430313172, 'auprc': 0.9037460538399034, 'f1': 0.8730964467005076, 'acc': 0.8730964467005076, 'eval_loss': 0.7194722012469643}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7574195499475208, 'tp': 209, 'tn': 312, 'fp': 44, 'fn': 26, 'auroc': 0.9319985656227587, 'auprc': 0.8983846389664039, 'f1': 0.8815566835871405, 'acc': 0.8815566835871405, 'eval_loss': 0.6436071313525501}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7077657952342363, 'tp': 205, 'tn': 301, 'fp': 55, 'fn': 30, 'auroc': 0.932942863973225, 'auprc': 0.9172454222458407, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 0.9555545833550001}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6751551526334807, 'tp': 199, 'tn': 298, 'fp': 58, 'fn': 36, 'auroc': 0.9282572316519244, 'auprc': 0.9131515181330029, 'f1': 0.8409475465313029, 'acc': 0.8409475465313029, 'eval_loss': 1.156331374457008}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7270774599873984, 'tp': 206, 'tn': 306, 'fp': 50, 'fn': 29, 'auroc': 0.934233803490318, 'auprc': 0.9185352969236551, 'f1': 0.8663282571912013, 'acc': 0.8663282571912013, 'eval_loss': 0.847096352396827}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7077657952342363, 'tp': 205, 'tn': 301, 'fp': 55, 'fn': 30, 'auroc': 0.9195792493425771, 'auprc': 0.8791807312268035, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 1.1407996529811306}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6774317701378088, 'tp': 210, 'tn': 284, 'fp': 72, 'fn': 25, 'auroc': 0.9295003585943103, 'auprc': 0.9145240178199009, 'f1': 0.8358714043993232, 'acc': 0.8358714043993232, 'eval_loss': 1.0440899808155863}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7197623903435865, 'tp': 192, 'tn': 320, 'fp': 36, 'fn': 43, 'auroc': 0.9124790819985655, 'auprc': 0.8778065632004046, 'f1': 0.8663282571912013, 'acc': 0.8663282571912013, 'eval_loss': 0.7031235510581418}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7237653897993122, 'tp': 194, 'tn': 319, 'fp': 37, 'fn': 41, 'auroc': 0.9077814965335883, 'auprc': 0.8594688885778632, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.7316319910368245}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7084758082372994, 'tp': 188, 'tn': 321, 'fp': 35, 'fn': 47, 'auroc': 0.9001553908677982, 'auprc': 0.8798514136371967, 'f1': 0.8612521150592216, 'acc': 0.8612521150592216, 'eval_loss': 0.6977581616098943}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7241110594136642, 'tp': 195, 'tn': 318, 'fp': 38, 'fn': 40, 'auroc': 0.9057016495338273, 'auprc': 0.876953154520232, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.7132270367521989}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7298738221037923, 'tp': 191, 'tn': 324, 'fp': 32, 'fn': 44, 'auroc': 0.9172125268945732, 'auprc': 0.8808456817006136, 'f1': 0.871404399323181, 'acc': 0.871404399323181, 'eval_loss': 0.6952708488036143}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.702508850248977, 'tp': 191, 'tn': 316, 'fp': 40, 'fn': 44, 'auroc': 0.9174037771934018, 'auprc': 0.8850058851028326, 'f1': 0.8578680203045685, 'acc': 0.8578680203045685, 'eval_loss': 0.9446802382406435}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.719336998570743, 'tp': 199, 'tn': 312, 'fp': 44, 'fn': 36, 'auroc': 0.9047214917523309, 'auprc': 0.8738550601741372, 'f1': 0.8646362098138748, 'acc': 0.8646362098138748, 'eval_loss': 0.8965251837906084}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6987871613916484, 'tp': 190, 'tn': 316, 'fp': 40, 'fn': 45, 'auroc': 0.9107219698780779, 'auprc': 0.8821561424093038, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 0.9683386738363066}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7166861279071115, 'tp': 200, 'tn': 310, 'fp': 46, 'fn': 35, 'auroc': 0.9104350944298352, 'auprc': 0.8751317195841501, 'f1': 0.8629441624365483, 'acc': 0.8629441624365483, 'eval_loss': 0.9422874001320451}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6994659746320121, 'tp': 198, 'tn': 307, 'fp': 49, 'fn': 37, 'auroc': 0.9143557255558212, 'auprc': 0.8902157546354237, 'f1': 0.8544839255499154, 'acc': 0.8544839255499154, 'eval_loss': 0.9446945159058822}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.751842064140191, 'tp': 197, 'tn': 324, 'fp': 32, 'fn': 38, 'auroc': 0.9230456610088453, 'auprc': 0.908133872988254, 'f1': 0.8815566835871405, 'acc': 0.8815566835871405, 'eval_loss': 0.930141986200684}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7330856847139489, 'tp': 187, 'tn': 329, 'fp': 27, 'fn': 48, 'auroc': 0.9104590007171887, 'auprc': 0.8950461659483787, 'f1': 0.8730964467005076, 'acc': 0.8730964467005076, 'eval_loss': 0.8134884397058111}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7156084795261304, 'tp': 189, 'tn': 322, 'fp': 34, 'fn': 46, 'auroc': 0.9076739182404971, 'auprc': 0.9030629617995567, 'f1': 0.8646362098138748, 'acc': 0.8646362098138748, 'eval_loss': 0.9352157962949652}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7368672899747387, 'tp': 191, 'tn': 326, 'fp': 30, 'fn': 44, 'auroc': 0.9063949318670811, 'auprc': 0.892977274132311, 'f1': 0.8747884940778342, 'acc': 0.8747884940778342, 'eval_loss': 0.9471273428827868}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7335270330790392, 'tp': 192, 'tn': 324, 'fp': 32, 'fn': 43, 'auroc': 0.8942385847477888, 'auprc': 0.8911334348662433, 'f1': 0.8730964467005076, 'acc': 0.8730964467005076, 'eval_loss': 0.9313850402832031}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7141067290189589, 'tp': 195, 'tn': 315, 'fp': 41, 'fn': 40, 'auroc': 0.9144035381305283, 'auprc': 0.8758628006412081, 'f1': 0.8629441624365483, 'acc': 0.8629441624365483, 'eval_loss': 0.7906696843473535}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7158225402335879, 'tp': 190, 'tn': 321, 'fp': 35, 'fn': 45, 'auroc': 0.9174874491991394, 'auprc': 0.8766815362584714, 'f1': 0.8646362098138748, 'acc': 0.8646362098138748, 'eval_loss': 0.7786592033348585}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7150370239236047, 'tp': 197, 'tn': 313, 'fp': 43, 'fn': 38, 'auroc': 0.9201051876643558, 'auprc': 0.8773271380265786, 'f1': 0.8629441624365483, 'acc': 0.8629441624365483, 'eval_loss': 0.779457804403807}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7234552590608545, 'tp': 193, 'tn': 320, 'fp': 36, 'fn': 42, 'auroc': 0.9160172125268946, 'auprc': 0.8809080762468375, 'f1': 0.868020304568528, 'acc': 0.868020304568528, 'eval_loss': 0.819323549929418}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6981575448387959, 'tp': 188, 'tn': 318, 'fp': 38, 'fn': 47, 'auroc': 0.9103394692804208, 'auprc': 0.863368176340634, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 0.805935863601534}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6868150014802072, 'tp': 198, 'tn': 303, 'fp': 53, 'fn': 37, 'auroc': 0.9096222806598135, 'auprc': 0.9004574226642795, 'f1': 0.8477157360406091, 'acc': 0.8477157360406091, 'eval_loss': 0.5551296892134767}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6798205730364804, 'tp': 197, 'tn': 302, 'fp': 54, 'fn': 38, 'auroc': 0.9161726033946929, 'auprc': 0.8877485307618279, 'f1': 0.8443316412859561, 'acc': 0.8443316412859561, 'eval_loss': 0.5514629734189886}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6892796906463147, 'tp': 197, 'tn': 305, 'fp': 51, 'fn': 38, 'auroc': 0.9107936887401387, 'auprc': 0.8922537951673345, 'f1': 0.8494077834179357, 'acc': 0.8494077834179357, 'eval_loss': 0.5520013625684538}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6620565850777331, 'tp': 198, 'tn': 295, 'fp': 61, 'fn': 37, 'auroc': 0.9067654793210614, 'auprc': 0.8931617752881243, 'f1': 0.8341793570219965, 'acc': 0.8341793570219966, 'eval_loss': 0.5650368897538436}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7004560143689196, 'tp': 194, 'tn': 312, 'fp': 44, 'fn': 41, 'auroc': 0.9121683002629691, 'auprc': 0.8936923705155535, 'f1': 0.8561759729272419, 'acc': 0.856175972927242, 'eval_loss': 0.5959712755131094}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6534065931888019, 'tp': 195, 'tn': 296, 'fp': 60, 'fn': 40, 'auroc': 0.906454697585465, 'auprc': 0.8402108740812091, 'f1': 0.8307952622673436, 'acc': 0.8307952622673435, 'eval_loss': 1.0027459326543307}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.693116887415892, 'tp': 198, 'tn': 305, 'fp': 51, 'fn': 37, 'auroc': 0.9048649294764524, 'auprc': 0.8685556315619607, 'f1': 0.8510998307952623, 'acc': 0.8510998307952623, 'eval_loss': 0.8859075943657541}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6962854570172705, 'tp': 198, 'tn': 306, 'fp': 50, 'fn': 37, 'auroc': 0.9012789863734162, 'auprc': 0.8592635890658809, 'f1': 0.8527918781725887, 'acc': 0.8527918781725888, 'eval_loss': 0.8846392231552225}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6939171837947201, 'tp': 194, 'tn': 310, 'fp': 46, 'fn': 41, 'auroc': 0.9111761893377959, 'auprc': 0.8610352480991088, 'f1': 0.8527918781725887, 'acc': 0.8527918781725888, 'eval_loss': 0.9479702593464601}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6560989730617224, 'tp': 190, 'tn': 303, 'fp': 53, 'fn': 45, 'auroc': 0.9021515658618215, 'auprc': 0.8573940858857563, 'f1': 0.8341793570219965, 'acc': 0.8341793570219966, 'eval_loss': 0.993336159931986}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6310178169291372, 'tp': 197, 'tn': 286, 'fp': 70, 'fn': 38, 'auroc': 0.9042911785799664, 'auprc': 0.8863616848052562, 'f1': 0.817258883248731, 'acc': 0.817258883248731, 'eval_loss': 0.7062186143900219}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6539028628333396, 'tp': 202, 'tn': 287, 'fp': 69, 'fn': 33, 'auroc': 0.9126583791537174, 'auprc': 0.8917435653716947, 'f1': 0.8274111675126904, 'acc': 0.8274111675126904, 'eval_loss': 0.7542769277566358}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.649512617400226, 'tp': 194, 'tn': 296, 'fp': 60, 'fn': 41, 'auroc': 0.902187425292852, 'auprc': 0.8831819999947906, 'f1': 0.8291032148900169, 'acc': 0.8291032148900169, 'eval_loss': 0.9787295429330123}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6752681579044029, 'tp': 195, 'tn': 303, 'fp': 53, 'fn': 40, 'auroc': 0.8979918718622998, 'auprc': 0.8796867179616388, 'f1': 0.8426395939086294, 'acc': 0.8426395939086294, 'eval_loss': 0.8558463799326044}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.6689657590654748, 'tp': 195, 'tn': 301, 'fp': 55, 'fn': 40, 'auroc': 0.8960554625866602, 'auprc': 0.865145670114756, 'f1': 0.8392554991539763, 'acc': 0.8392554991539763, 'eval_loss': 0.9725046565658167}


### 3.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [22]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT
dfResultsModelsTotal

dfResultssModelsTotal1 = dfResultsModelsTotal.copy()

dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.724856,200.6,311.8,44.2,34.4,0.934582,0.90793,0.836182,0.867005,0.647933
BERT,0.729153,203.2,310.0,46.0,31.8,0.921009,0.891131,0.839323,0.868359,0.85497
RoBERTa,0.770648,204.8,321.0,35.0,30.2,0.93317,0.921721,0.862679,0.889679,0.798878
DistilBERT,0.714284,198.0,311.6,44.4,37.0,0.916665,0.889748,0.829493,0.862267,0.770141
CamemBERT,0.69366,215.6,281.6,74.4,19.4,0.924057,0.877363,0.821333,0.841286,0.611313
Albert,0.742845,205.0,312.2,43.8,30.0,0.929847,0.899375,0.847458,0.875127,0.688296
Flaubert,0.699039,205.0,298.0,58.0,30.0,0.928903,0.908527,0.823293,0.8511,1.028774


### 3.2. Results using original dataset (texts) 

In [23]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotalw = dfResultsModelsTotalw.reset_index(drop=True)
dfResultsModelsTotalw.index = indexBERT
dfResultsModelsTotalw

dfResultssModelsTotal1w = dfResultsModelsTotalw.copy()
dfResultssModelsTotal1w

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.699039,205.0,298.0,58.0,30.0,0.928903,0.908527,0.823293,0.8511,1.028774
BERT,0.69911,203.833333,299.5,56.5,31.166667,0.926478,0.905475,0.823015,0.851664,1.014761
RoBERTa,0.704787,202.833333,302.333333,53.666667,32.166667,0.923125,0.905628,0.825365,0.854766,1.012543
DistilBERT,0.698892,202.166667,301.333333,54.666667,32.833333,0.925809,0.901001,0.822094,0.851946,0.991635
CamemBERT,0.699275,203.166667,300.333333,55.666667,31.833333,0.926114,0.906055,0.822815,0.851946,0.956641
Albert,0.691882,202.5,298.833333,57.166667,32.5,0.924444,0.900005,0.818733,0.84828,1.022868
Flaubert,0.694027,203.333333,298.5,57.5,31.666667,0.923428,0.901297,0.820168,0.849126,1.019396


## 4. BERT Models applied to Category IV - Scientific Tweets

In [24]:
#gc.collect()
#torch.cuda.empty_cache()
limitsave=0

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y4, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1 = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1b = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1 = dfResultsModels1.append(dfResultsModels1b)

    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)
    
    if(idx == 0):
        dfResultsModelsTotal = dfResultsModels1Trans.copy()
    else:
        dfResultsModelsTotal = dfResultsModelsTotal.append(dfResultsModels1Trans)
    dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-4.csv')

X1_train, X1_test, y1_train, y1_test = train_test_split(X2, Y4, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })
for idx, model in enumerate(c_model_1):
    
    for i in range(0,N_ITER):
        model1 = ClassificationModel(
        c_model_1[idx], c_model_2[idx],
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            torch.save(model1, 'model1'+str(i)+'.pt')
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        if(i==0):
            dfResultsModels1w = pd.DataFrame.from_dict(result1, orient="index").T
        else:
            dfResultsModels1bw = pd.DataFrame.from_dict(result1, orient="index").T
            dfResultsModels1w = dfResultsModels1.append(dfResultsModels1bw)

    dfResultsModels1Transw = pd.DataFrame(dfResultsModels1w.mean(axis=0)).T
    dfResultsModels1Transw['f1'] = calcule_f1(dfResultsModels1Transw)
    
    if(idx == 0):
        dfResultsModelsTotalw = dfResultsModels1Transw.copy()
    else:
        dfResultsModelsTotalw = dfResultsModelsTotalw.append(dfResultsModels1Transw)
    dfResultsModelsTotalw.to_csv('dfResultsModelsTotalEMB-w-4.csv')

Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8383593766305091, 'tp': 141, 'tn': 412, 'fp': 25, 'fn': 13, 'auroc': 0.9717970816368986, 'auprc': 0.9196827795834618, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.31803498480861125}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8416739089517946, 'tp': 144, 'tn': 409, 'fp': 28, 'fn': 10, 'auroc': 0.9765074742191447, 'auprc': 0.942529868605018, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.2827381644594042}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8344194419369123, 'tp': 144, 'tn': 407, 'fp': 30, 'fn': 10, 'auroc': 0.9686469137270053, 'auprc': 0.9130359813171621, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.31032194292760995}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8383593766305091, 'tp': 141, 'tn': 412, 'fp': 25, 'fn': 13, 'auroc': 0.9737139290915034, 'auprc': 0.9374182832043815, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.2817699184984361}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8260383356700589, 'tp': 140, 'tn': 410, 'fp': 27, 'fn': 14, 'auroc': 0.9678742310321258, 'auprc': 0.931582750371404, 'f1': 0.9306260575296108, 'acc': 0.9306260575296108, 'eval_loss': 0.2976621878578475}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.863093327874748, 'tp': 137, 'tn': 423, 'fp': 14, 'fn': 17, 'auroc': 0.9730304020921869, 'auprc': 0.9311979555397313, 'f1': 0.9475465313028765, 'acc': 0.9475465313028765, 'eval_loss': 0.3081663483723165}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8234879457991136, 'tp': 141, 'tn': 408, 'fp': 29, 'fn': 13, 'auroc': 0.9647983595352018, 'auprc': 0.9000861065339136, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.3723353409134832}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8450462756360294, 'tp': 140, 'tn': 415, 'fp': 22, 'fn': 14, 'auroc': 0.9648429373829832, 'auprc': 0.9215250468192726, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.3740164883753383}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8601119059225928, 'tp': 139, 'tn': 420, 'fp': 17, 'fn': 15, 'auroc': 0.9727777942880917, 'auprc': 0.9413925413930015, 'f1': 0.9458544839255499, 'acc': 0.9458544839255499, 'eval_loss': 0.2920081458624305}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.822961226180195, 'tp': 137, 'tn': 413, 'fp': 24, 'fn': 17, 'auroc': 0.952138250765253, 'auprc': 0.899186796129291, 'f1': 0.9306260575296108, 'acc': 0.9306260575296108, 'eval_loss': 0.3164603541372344}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8426211141324766, 'tp': 137, 'tn': 418, 'fp': 19, 'fn': 17, 'auroc': 0.9755119022853577, 'auprc': 0.9481520836275414, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.3577047394202581}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8520831609170222, 'tp': 139, 'tn': 418, 'fp': 19, 'fn': 15, 'auroc': 0.9763588813932063, 'auprc': 0.9395422698570715, 'f1': 0.9424703891708968, 'acc': 0.9424703891708968, 'eval_loss': 0.3655056119390984}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8394243779523826, 'tp': 138, 'tn': 416, 'fp': 21, 'fn': 16, 'auroc': 0.9724657493536213, 'auprc': 0.9421921990437323, 'f1': 0.937394247038917, 'acc': 0.937394247038917, 'eval_loss': 0.3494100344159003}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8648088601251592, 'tp': 140, 'tn': 420, 'fp': 17, 'fn': 14, 'auroc': 0.9741448482867247, 'auprc': 0.9249069088909198, 'f1': 0.9475465313028765, 'acc': 0.9475465313028765, 'eval_loss': 0.29323429244840027}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8560813228768759, 'tp': 139, 'tn': 419, 'fp': 18, 'fn': 15, 'auroc': 0.9744271746560077, 'auprc': 0.9372114292511586, 'f1': 0.9441624365482234, 'acc': 0.9441624365482234, 'eval_loss': 0.3014364949378528}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.834663331174837, 'tp': 137, 'tn': 416, 'fp': 21, 'fn': 17, 'auroc': 0.9650509673392969, 'auprc': 0.911042559433683, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.3366230232396016}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8365782537957376, 'tp': 134, 'tn': 420, 'fp': 17, 'fn': 20, 'auroc': 0.9664031620553359, 'auprc': 0.9093690328568697, 'f1': 0.937394247038917, 'acc': 0.937394247038917, 'eval_loss': 0.3291559760752869}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8284013992261899, 'tp': 134, 'tn': 418, 'fp': 19, 'fn': 20, 'auroc': 0.964218847514042, 'auprc': 0.9233485103697493, 'f1': 0.934010152284264, 'acc': 0.934010152284264, 'eval_loss': 0.3047267984488587}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8433732460459296, 'tp': 138, 'tn': 417, 'fp': 20, 'fn': 16, 'auroc': 0.974575767481946, 'auprc': 0.9386571950215098, 'f1': 0.9390862944162437, 'acc': 0.9390862944162437, 'eval_loss': 0.3285046662387781}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8394243779523826, 'tp': 138, 'tn': 416, 'fp': 21, 'fn': 16, 'auroc': 0.9790484115426907, 'auprc': 0.944614636594417, 'f1': 0.937394247038917, 'acc': 0.937394247038917, 'eval_loss': 0.3123885521567182}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8216417802797712, 'tp': 145, 'tn': 402, 'fp': 35, 'fn': 9, 'auroc': 0.9764034592409879, 'auprc': 0.9219065225215068, 'f1': 0.9255499153976311, 'acc': 0.9255499153976311, 'eval_loss': 0.2926702439588936}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7996434768290417, 'tp': 144, 'tn': 397, 'fp': 40, 'fn': 10, 'auroc': 0.9759131029153912, 'auprc': 0.9190054477042833, 'f1': 0.9153976311336718, 'acc': 0.9153976311336718, 'eval_loss': 0.30227604101559047}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8194870681898663, 'tp': 148, 'tn': 397, 'fp': 40, 'fn': 6, 'auroc': 0.973936818330411, 'auprc': 0.8936256808768137, 'f1': 0.922165820642978, 'acc': 0.922165820642978, 'eval_loss': 0.3020336041226983}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.837857862881515, 'tp': 149, 'tn': 401, 'fp': 36, 'fn': 5, 'auroc': 0.9801925763024162, 'auprc': 0.9356652075590728, 'f1': 0.9306260575296108, 'acc': 0.9306260575296108, 'eval_loss': 0.2880055888212825}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7981503148622383, 'tp': 147, 'tn': 392, 'fp': 45, 'fn': 7, 'auroc': 0.9777705132396208, 'auprc': 0.9316919587877852, 'f1': 0.9120135363790186, 'acc': 0.9120135363790186, 'eval_loss': 0.3340651696351798}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.767777000998765, 'tp': 128, 'tn': 410, 'fp': 27, 'fn': 26, 'auroc': 0.9513952866355613, 'auprc': 0.8596959653147178, 'f1': 0.910321489001692, 'acc': 0.9103214890016921, 'eval_loss': 0.4416341918863748}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7579980016215483, 'tp': 126, 'tn': 410, 'fp': 27, 'fn': 28, 'auroc': 0.9429849326874499, 'auprc': 0.9000776897907251, 'f1': 0.9069373942470389, 'acc': 0.9069373942470389, 'eval_loss': 0.4435633185662721}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7414865181147059, 'tp': 125, 'tn': 407, 'fp': 30, 'fn': 29, 'auroc': 0.953683616155012, 'auprc': 0.8850867908588358, 'f1': 0.9001692047377327, 'acc': 0.9001692047377327, 'eval_loss': 0.4226741688816171}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8191211121756424, 'tp': 137, 'tn': 412, 'fp': 25, 'fn': 17, 'auroc': 0.9462093970103124, 'auprc': 0.8762978005207455, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.4435564700612112}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.791113756819374, 'tp': 132, 'tn': 411, 'fp': 26, 'fn': 22, 'auroc': 0.9452138250765253, 'auprc': 0.8915555017195357, 'f1': 0.9187817258883249, 'acc': 0.9187817258883249, 'eval_loss': 0.4534162873108136}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8094805829031385, 'tp': 135, 'tn': 412, 'fp': 25, 'fn': 19, 'auroc': 0.9601325448007371, 'auprc': 0.9176073540610127, 'f1': 0.9255499153976311, 'acc': 0.9255499153976311, 'eval_loss': 0.5511873553286454}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.816368879311751, 'tp': 138, 'tn': 410, 'fp': 27, 'fn': 16, 'auroc': 0.9644565960355433, 'auprc': 0.893120679027932, 'f1': 0.9272419627749577, 'acc': 0.9272419627749577, 'eval_loss': 0.5077937824749633}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8277628333291047, 'tp': 138, 'tn': 413, 'fp': 24, 'fn': 16, 'auroc': 0.9703408719427027, 'auprc': 0.9342595492706506, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.44829333784352793}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7905901868735566, 'tp': 135, 'tn': 407, 'fp': 30, 'fn': 19, 'auroc': 0.9665071770334929, 'auprc': 0.9203127486208599, 'f1': 0.9170896785109983, 'acc': 0.9170896785109983, 'eval_loss': 0.4865302439996556}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8355066790766313, 'tp': 138, 'tn': 415, 'fp': 22, 'fn': 16, 'auroc': 0.9705637611816101, 'auprc': 0.9379113365002061, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.43851211214649466}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8148343429443037, 'tp': 132, 'tn': 417, 'fp': 20, 'fn': 22, 'auroc': 0.9634313055365687, 'auprc': 0.9100908996376744, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.31467391964734387}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8060150788486314, 'tp': 131, 'tn': 416, 'fp': 21, 'fn': 23, 'auroc': 0.9587060536717287, 'auprc': 0.9120321491633515, 'f1': 0.9255499153976311, 'acc': 0.9255499153976311, 'eval_loss': 0.3590090053744222}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8230026974910638, 'tp': 132, 'tn': 419, 'fp': 18, 'fn': 22, 'auroc': 0.9563582870219026, 'auprc': 0.9176423796273321, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.3269959663187987}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8163849264473023, 'tp': 134, 'tn': 415, 'fp': 22, 'fn': 20, 'auroc': 0.9601771226485185, 'auprc': 0.912642586562303, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.3116426121835646}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8163849264473023, 'tp': 134, 'tn': 415, 'fp': 22, 'fn': 20, 'auroc': 0.9593004249754822, 'auprc': 0.9069965496579246, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.3144464105073559}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8020001251244493, 'tp': 131, 'tn': 415, 'fp': 22, 'fn': 23, 'auroc': 0.9504740111147435, 'auprc': 0.9191264089426466, 'f1': 0.9238578680203046, 'acc': 0.9238578680203046, 'eval_loss': 0.4473297024929994}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8308209276361849, 'tp': 131, 'tn': 422, 'fp': 15, 'fn': 23, 'auroc': 0.9577996374335047, 'auprc': 0.9111501048494697, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.373968415979394}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8448930489823439, 'tp': 134, 'tn': 422, 'fp': 15, 'fn': 20, 'auroc': 0.9527771999167881, 'auprc': 0.9186196631417007, 'f1': 0.9407783417935702, 'acc': 0.9407783417935702, 'eval_loss': 0.41121553642197367}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8155814437278969, 'tp': 133, 'tn': 416, 'fp': 21, 'fn': 21, 'auroc': 0.9580819638027875, 'auprc': 0.9057549703633847, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.4280939535237849}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8148343429443037, 'tp': 132, 'tn': 417, 'fp': 20, 'fn': 22, 'auroc': 0.9619899551249665, 'auprc': 0.9212509669868398, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.38251345229065536}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8196009745256098, 'tp': 133, 'tn': 417, 'fp': 20, 'fn': 21, 'auroc': 0.9570120954560314, 'auprc': 0.902886094445626, 'f1': 0.9306260575296108, 'acc': 0.9306260575296108, 'eval_loss': 0.3964262843181036}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7988941346571861, 'tp': 132, 'tn': 413, 'fp': 24, 'fn': 22, 'auroc': 0.958230556628726, 'auprc': 0.9066098904155772, 'f1': 0.922165820642978, 'acc': 0.922165820642978, 'eval_loss': 0.43709473767758983}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8018376698687179, 'tp': 135, 'tn': 410, 'fp': 27, 'fn': 19, 'auroc': 0.9508306338969954, 'auprc': 0.915933410514429, 'f1': 0.922165820642978, 'acc': 0.922165820642978, 'eval_loss': 0.3520385802012721}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8181559482943027, 'tp': 136, 'tn': 413, 'fp': 24, 'fn': 18, 'auroc': 0.9504442925495558, 'auprc': 0.8973997317279577, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.42569668275475697}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8115944724721967, 'tp': 133, 'tn': 415, 'fp': 22, 'fn': 21, 'auroc': 0.9584683051502273, 'auprc': 0.9082107692013379, 'f1': 0.9272419627749577, 'acc': 0.9272419627749577, 'eval_loss': 0.4464483804584138}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8133468018711243, 'tp': 135, 'tn': 413, 'fp': 24, 'fn': 19, 'auroc': 0.9611726945823055, 'auprc': 0.9005416756463559, 'f1': 0.9272419627749577, 'acc': 0.9272419627749577, 'eval_loss': 0.3539204703778715}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8291214610615695, 'tp': 135, 'tn': 417, 'fp': 20, 'fn': 19, 'auroc': 0.9588397872150733, 'auprc': 0.9082527300326666, 'f1': 0.934010152284264, 'acc': 0.934010152284264, 'eval_loss': 0.34883530403634433}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8243632797408541, 'tp': 134, 'tn': 417, 'fp': 20, 'fn': 20, 'auroc': 0.9595976106273589, 'auprc': 0.8831286069751259, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.3457022977680409}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8318604079044017, 'tp': 133, 'tn': 420, 'fp': 17, 'fn': 21, 'auroc': 0.9574132960860651, 'auprc': 0.8908288946439392, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.3764639321782038}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8318604079044017, 'tp': 133, 'tn': 420, 'fp': 17, 'fn': 21, 'auroc': 0.9614253023864008, 'auprc': 0.8948414968257793, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.33409304652166993}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.811337451886574, 'tp': 140, 'tn': 406, 'fp': 31, 'fn': 14, 'auroc': 0.9677404974887813, 'auprc': 0.9115127280545053, 'f1': 0.9238578680203046, 'acc': 0.9238578680203046, 'eval_loss': 0.2902134509365025}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8287468573034439, 'tp': 139, 'tn': 412, 'fp': 25, 'fn': 15, 'auroc': 0.96494695236114, 'auprc': 0.9217160497202357, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.2695496978826429}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8234879457991136, 'tp': 141, 'tn': 408, 'fp': 29, 'fn': 13, 'auroc': 0.9654373086867366, 'auprc': 0.8940677321135341, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.2690524240269473}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8126181622436626, 'tp': 141, 'tn': 405, 'fp': 32, 'fn': 13, 'auroc': 0.9688995215311005, 'auprc': 0.9157495879414385, 'f1': 0.9238578680203046, 'acc': 0.9238578680203046, 'eval_loss': 0.28776933679259137}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8277628333291047, 'tp': 138, 'tn': 413, 'fp': 24, 'fn': 16, 'auroc': 0.966774644120182, 'auprc': 0.9124680710898698, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.2674588686541507}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8251303223423604, 'tp': 135, 'tn': 416, 'fp': 21, 'fn': 19, 'auroc': 0.9639810989925406, 'auprc': 0.9011775813816002, 'f1': 0.9323181049069373, 'acc': 0.9323181049069373, 'eval_loss': 0.35516883579916075}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8331451157538114, 'tp': 135, 'tn': 418, 'fp': 19, 'fn': 19, 'auroc': 0.9652589972956106, 'auprc': 0.9226936140652906, 'f1': 0.9357021996615905, 'acc': 0.9357021996615905, 'eval_loss': 0.3359200174332057}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8108005498250296, 'tp': 132, 'tn': 416, 'fp': 21, 'fn': 22, 'auroc': 0.9565663169782164, 'auprc': 0.9202945978843452, 'f1': 0.9272419627749577, 'acc': 0.9272419627749577, 'eval_loss': 0.35728423102562756}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7966843462243632, 'tp': 137, 'tn': 406, 'fp': 31, 'fn': 17, 'auroc': 0.9556450414573984, 'auprc': 0.9185726473673735, 'f1': 0.9187817258883249, 'acc': 0.9187817258883249, 'eval_loss': 0.37435517727250334}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7824038419482815, 'tp': 131, 'tn': 410, 'fp': 27, 'fn': 23, 'auroc': 0.9634313055365689, 'auprc': 0.9212481479002528, 'f1': 0.9153976311336718, 'acc': 0.9153976311336718, 'eval_loss': 0.36017354157459186}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7950697822709131, 'tp': 127, 'tn': 418, 'fp': 19, 'fn': 27, 'auroc': 0.9469672204225981, 'auprc': 0.904785774106782, 'f1': 0.922165820642978, 'acc': 0.922165820642978, 'eval_loss': 0.501100837093729}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8148343429443037, 'tp': 132, 'tn': 417, 'fp': 20, 'fn': 22, 'auroc': 0.944886920859461, 'auprc': 0.8966835002753045, 'f1': 0.9289340101522843, 'acc': 0.9289340101522843, 'eval_loss': 0.5339501802196824}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.7923864636640535, 'tp': 129, 'tn': 415, 'fp': 22, 'fn': 25, 'auroc': 0.9501173883324913, 'auprc': 0.9102882898049997, 'f1': 0.9204737732656514, 'acc': 0.9204737732656514, 'eval_loss': 0.45731083816836443}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.8060150788486314, 'tp': 131, 'tn': 416, 'fp': 21, 'fn': 23, 'auroc': 0.9347380308478707, 'auprc': 0.8984374092012397, 'f1': 0.9255499153976311, 'acc': 0.9255499153976311, 'eval_loss': 0.5052213875919973}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.760332193502895, 'tp': 134, 'tn': 400, 'fp': 37, 'fn': 20, 'auroc': 0.9402656839727778, 'auprc': 0.9114032503638227, 'f1': 0.9035532994923858, 'acc': 0.9035532994923858, 'eval_loss': 0.5523721031648549}


### 4.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [25]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT
dfResultsModelsTotal

dfResultssModelsTotal1 = dfResultsModelsTotal.copy()

dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.83577,142.0,410.0,27.0,12.0,0.971708,0.92885,0.879257,0.93401,0.298105
BERT,0.84294,138.8,415.8,21.2,15.2,0.965518,0.918678,0.884076,0.938409,0.332597
RoBERTa,0.851004,138.6,418.2,18.8,15.4,0.974582,0.938401,0.890173,0.942132,0.333458
DistilBERT,0.836488,136.2,417.4,19.6,17.8,0.969859,0.925406,0.879277,0.936717,0.32228
CamemBERT,0.815356,146.6,397.8,39.2,7.4,0.976843,0.920379,0.862861,0.921151,0.30381
Albert,0.775499,129.6,410.0,27.0,24.4,0.947897,0.882543,0.834514,0.913029,0.440969
Flaubert,0.815942,136.8,411.4,25.6,17.2,0.9664,0.920642,0.864728,0.92758,0.486463


### 4.2. Results using original dataset (texts) 

In [26]:
indexBERT = ['TweetBERT','BERT','RoBERTa','DistilBERT','CamemBERT','Albert','Flaubert']

#dfResultsModelsTotal.reindex(indexBERT)
dfResultsModelsTotalw = dfResultsModelsTotalw.reset_index(drop=True)
dfResultsModelsTotalw.index = indexBERT
dfResultsModelsTotalw

dfResultssModelsTotal1w = dfResultsModelsTotalw.copy()
dfResultssModelsTotal1w

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.816016,136.333333,412.0,25.0,17.666667,0.965217,0.918368,0.864693,0.927806,0.457794
BERT,0.815757,136.0,412.333333,24.666667,18.0,0.965665,0.920744,0.864407,0.927806,0.469138
RoBERTa,0.815217,136.166667,412.0,25.0,17.833333,0.965078,0.91857,0.864093,0.927524,0.479794
DistilBERT,0.818595,136.166667,412.833333,24.166667,17.833333,0.965571,0.916342,0.866384,0.928934,0.461068
CamemBERT,0.817912,137.0,411.666667,25.333333,17.0,0.966463,0.91928,0.866175,0.92837,0.449963
Albert,0.810352,135.833333,411.166667,25.833333,18.166667,0.965905,0.920743,0.860612,0.92555,0.465415
Flaubert,0.806674,136.333333,409.5,27.5,17.666667,0.962044,0.919102,0.857892,0.923576,0.497448
