# Combining Knowledge Graphs and Deep Learning techniques for Categorizing Tweets
## BERT Models (BERTweet, BERT, RoBERTa, CamemBERT, DistilBERT, ALBERT, FlauBERT)


Authors:

Experiments:
* Applying BERT-family transformer models to 2 datasets for classifying 4 binary categories.
* 2 datasets: (i) textual information and (ii) textual information and embeddings obtained from knowledge graph exploitation (KGE).
 
 


In [1]:
from keras.preprocessing import sequence
from keras.models import Sequential
from keras.layers import Dense, Dropout, Embedding, LSTM, Bidirectional
from keras.datasets import imdb 
import spacy
import nltk.data
import pandas as pd
import numpy as np
from nltk.tokenize import word_tokenize
from nltk.stem import SnowballStemmer
import regex as re
import string
from collections import defaultdict
import matplotlib.pyplot as plt
import seaborn as sns
pd.set_option('display.max_colwidth', None)
import sklearn
from sklearn.model_selection import train_test_split
from sklearn.metrics import f1_score, accuracy_score
from simpletransformers.classification import ClassificationModel
import io
import os
import json
from collections import Counter
from wordcloud import WordCloud
import re, string, unicodedata
import nltk
from nltk import word_tokenize, sent_tokenize, FreqDist
from nltk.corpus import stopwords
from nltk.stem import LancasterStemmer, WordNetLemmatizer
nltk.download
from ast import literal_eval
# Load the reduced "md4" export of the tweet dataset.  The two converter columns are
# stored as Python literals (presumably embedding vectors) and are parsed back with
# literal_eval.
# The full export, 'ed-dataset-falcon_spacy2-embeddings-sentence.csv', additionally
# needs literal_eval for: entities_instances_wikidata, spacy_entities_ids,
# spacy_entities_labels, falcon_spacy_entities, falcon_spacy_labels,
# falcon_spacy_embeddingsmd2_mw100_RW and sent_embedding_2.
tweets = pd.read_csv(
    'ed-dataset-falcon_spacy2-embeddings-sentence-md4.csv',
    sep=';',
    encoding='utf8',
    converters={
        'falcon_spacy_embeddingsmd4_mw50_RW': literal_eval,
        'sent_embedding_1': literal_eval,
    },
    # `error_bad_lines=False` was deprecated in pandas 1.3 and removed in 2.0.
    # `on_bad_lines='warn'` (pandas >= 1.3) keeps the same behaviour: malformed rows
    # are skipped and a warning is emitted for each of them.
    on_bad_lines='warn',
)

In [2]:
# Sizing constants; none of them is referenced by the cells visible in this section.
# NOTE(review): the original comment "cut texts after this number of words" sat on
# n_unique_words but reads like a description of maxlen — confirm which one it means.
batch_size = 128
maxlen = 100
n_unique_words = 10_000

In [3]:
# Characters deleted from tweets during cleaning.  Written as a raw string because the
# backslash in front of ']' is meant literally: "\]" in a normal string is an invalid
# escape sequence (DeprecationWarning, SyntaxWarning from Python 3.12 on).
punctuations = r"¡!#$%&'()*+,-./:;<=>¿?@[\]^_`{|}~"

def read_txt(filename):
    """Return the lines of a UTF-8 text file as a list of strings.

    Every newline character is removed from each line; all other whitespace is kept.
    """
    with open(filename, 'r', encoding='utf-8') as handle:
        return [str(raw).replace('\n', '') for raw in handle.readlines()]

# English Snowball stemmer; clean_tweet applies it only when called with stem=True.
stemmer = SnowballStemmer('english')

# Stop words, one entry per line of the file.
# NOTE(review): this rebinds the name `stopwords` imported from nltk.corpus earlier.
stopwords = read_txt('english_stopwords.txt')


def clean_accents(tweet):
    """Replace lowercase accented letters with their unaccented ASCII counterpart.

    Covers the accented forms of a, c, e, i, o, u and y listed in the table below;
    uppercase accented letters and every other character are left unchanged.
    """
    substitutions = (
        (r"[àáâãäå]", "a"),
        (r"ç", "c"),
        (r"[èéêë]", "e"),
        (r"[ìíîï]", "i"),
        (r"[òóôõö]", "o"),
        (r"[ùúûü]", "u"),
        (r"[ýÿ]", "y"),
    )
    for pattern, plain in substitutions:
        tweet = re.sub(pattern, plain, tweet)
    return tweet

def clean_tweet(tweet, stem = False):
    """Normalise a raw tweet into a space-separated string of lowercase tokens.

    Steps, in order: lowercase and trim; drop URLs; drop @mentions and #hashtags;
    turn newlines into spaces; strip accents (clean_accents); replace laughter
    ("haha", "lol", "xd", "jaja", ...) with a placeholder; delete every character
    listed in `punctuations`; drop stop words; optionally stem.

    Args:
        tweet: Raw tweet text.
        stem: When True, each kept token is passed through `stemmer.stem`.

    Returns:
        The kept tokens joined by single spaces ("" when nothing survives).
    """
    tweet = tweet.lower().strip()
    # URLs: either with an http/https scheme or starting with "www.".  The previous
    # "www?:\/\/" pattern could never match a bare "www.example.com" address, and
    # the separate "http?:\/\/" pattern was already covered by "https?:\/\/".
    tweet = re.sub(r'(?:https?:\/\/|\bwww\.)\S+', '', tweet)
    # Mentions and hashtags.  "(?:^|\s)" also catches one at the very start of the
    # tweet; requiring a preceding whitespace character left a leading "@user" in
    # place, which then survived as the token "user".
    tweet = re.sub(r'(?:^|\s)[@#][\w_-]+', "", tweet)
    tweet = re.sub(r"\n", " ", tweet)
    tweet = clean_accents(tweet)
    # The angle brackets of the placeholder are deleted by the punctuation pass
    # below, so laughter ends up as the token "risas".
    tweet = re.sub(r"\b(a*ha+h[ha]*|o?l+o+l+[ol]*|x+d+[x*d*]*|a*ja+[j+a+]+)\b", "<risas>", tweet)
    # Delete every punctuation character in one pass.
    tweet = tweet.translate(str.maketrans('', '', punctuations))
    # No punctuation is left at this point, so only the stop-word filter is needed.
    kept = [token for token in tweet.split() if token not in stopwords]
    if stem:
        kept = [stemmer.stem(token) for token in kept]
    return " ".join(kept)

In [4]:
# Work on a copy so the loaded `tweets` frame stays untouched, then add a column with
# the cleaned version of every original tweet text.
tweets1 = tweets.copy()
tweets1['text_cleaned'] = tweets['text_orig'].apply(clean_tweet)
print(tweets1['text_cleaned'].head(5))

0                                                                                                                                                                               make better
1    effects dosagecontrolled cannabis capsules cancerrelated cachexia anorexia syndrome advanced cancer patients pilot study gil barsela daniela zalman valerya semenysty eyal ballan 2019
2                                                                                                                                                                    kaydoloo best anorexic
3                                                                                                                                                                        maxy best anorexic
4                                                                                                                                                                                      ur f
Name: text_cleaned, dtype: object


In [5]:
# Build the model inputs: every sample is the row's `sent_embedding_1` value rendered
# as a string with one space on each side, following
# https://mccormickml.com/2021/06/29/combining-categorical-numerical-features-with-bert/

# Fresh copy of the loaded frame, with missing values replaced by empty strings.
data_df = tweets.copy().fillna("")

print('Combining features ...')

# One input string per row.
sen_w_feats = [" {:} ".format(embedding) for embedding in data_df["sent_embedding_1"]]

# One label per row, taken from the "ProED" column.
# NOTE(review): `labels` is not referenced by the later cells visible here, which
# take their targets from tweets1 instead.
labels = data_df["ProED"].tolist()

print('  DONE.')

print('Dataset contains {:,} samples.'.format(len(sen_w_feats)))



Combining features into strings...
  DONE.
Dataset contains 1,968 samples.


In [6]:
# Inputs: X holds the stringified sentence embeddings, X2 the cleaned tweet text
# (X2 is not used by the splits below).
X, X2 = sen_w_feats, tweets1['text_cleaned']

# One binary target column per category.
df = tweets1.copy()
Y1, Y2, Y3, Y4 = (df[column] for column in ('ED_Patient', 'ProED', 'informative', 'scientific'))

# 70/30 hold-out split for each target, all with the same random_state.
X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y1, random_state=42, test_size=0.3)
X2_train, X2_test, y2_train, y2_test = train_test_split(X, Y2, random_state=42, test_size=0.3)
X3_train, X3_test, y3_train, y3_test = train_test_split(X, Y3, random_state=42, test_size=0.3)
X4_train, X4_test, y4_train, y4_test = train_test_split(X, Y4, random_state=42, test_size=0.3)

In [7]:
# Class balance of the ED_Patient test labels, shown as proportions.
y1_test.value_counts(normalize=True)

1    0.500846
0    0.499154
Name: ED_Patient, dtype: float64

In [8]:
# Training options handed to ClassificationModel through its `args=` parameter.
# NOTE(review): "evaluation_strategy" looks like a Hugging Face Trainer option rather
# than a simpletransformers one — confirm that it has any effect here.
train_args = dict(
    reprocess_input_data=True,
    fp16=False,
    evaluate_during_training=False,
    evaluate_during_training_verbose=False,
    learning_rate=2e-5,
    train_batch_size=32,
    eval_batch_size=32,
    num_train_epochs=15,
    overwrite_output_dir=True,
    evaluation_strategy='epochs',
)
#optimizer = torch.optim.SGD(model.parameters(), lr=0.01, momentum=0.9)


def f1_multiclass(labels, preds):
    """Micro-averaged F1 of `preds` against `labels` (sklearn `f1_score`, average='micro').

    Note: for single-label predictions the micro average coincides with accuracy,
    which is why the recorded runs report identical 'f1' and 'acc' values.
    """
    micro_f1 = f1_score(labels, preds, average='micro')
    return micro_f1

def calcule_f1(df):
    """F1 score from confusion counts: tp / (tp + 0.5 * (fp + fn)).

    `df` is anything indexable by the keys 'tp', 'fp' and 'fn'.
    """
    true_pos = df['tp']
    errors = df['fp'] + df['fn']
    return true_pos / (true_pos + 0.5 * errors)

import torch
import gc
from tqdm import tqdm


# Empty frame; it is not referenced again in the cells visible here.
dfEval1 = pd.DataFrame()

In [20]:
# Number of independent train/evaluate runs per model; their metrics are averaged.
N_ITER = 4

In [10]:
# Run Python's garbage collector first, then ask PyTorch to empty its CUDA cache.
gc.collect()
torch.cuda.empty_cache()

In [11]:
import torch
# Report whether PyTorch can see a CUDA device.
print(torch.cuda.is_available())


True


## 1. BERT Models applied to Category I - Tweets written by people suffering from eating disorders

In [21]:
# Number of leading runs per architecture whose trained model is pickled to disk
# (0 disables saving).
# NOTE(review): the file name below does not include the architecture, so with
# limitsave > 0 each architecture would overwrite the previous one's files.
limitsave=0

# 70/30 hold-out split for Category I (target column: ED_Patient).
X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y1, test_size=0.3, random_state=42)
# The columns are not named 'text'/'labels', so simpletransformers falls back to
# using column 0 as text and column 1 as labels (it logs a warning saying so).
# NOTE(review): despite its name, 'text_cleaned' holds the values of X here.
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

# Parallel lists: simpletransformers model type and the matching pretrained checkpoint.
c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

# One single-row frame of averaged metrics per architecture, in c_model_1 order.
per_model_means = []

for model_type, model_name in zip(c_model_1, c_model_2):

    # Metric dictionaries of every run for this architecture.
    run_results = []
    for i in range(N_ITER):
        model1 = ClassificationModel(
            model_type, model_name,
            # Use the GPU when one is available instead of failing on CPU-only machines.
            use_cuda=torch.cuda.is_available(),
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if i < limitsave:
            torch.save(model1, 'model1'+str(i)+'.pt')
        # Drop the model and free its memory before the next run starts.
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        run_results.append(result1)

    # One row per run, built in a single step.  DataFrame.append was removed in
    # pandas 2.0 and re-copied the whole frame on every call.
    dfResultsModels1 = pd.DataFrame(run_results)

    # Average every metric over the runs, then replace the averaged 'f1' with the
    # F1 recomputed from the averaged tp/fp/fn counts.
    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)

    # Rebuilt after every architecture so partial results survive an interrupted run.
    per_model_means.append(dfResultsModels1Trans)
    dfResultsModelsTotal = pd.concat(per_model_means)
    # Optional: persist the summary after each architecture.
    #dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-1.csv')

Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.08455626111951116, 'tp': 134, 'tn': 186, 'fp': 109, 'fn': 162, 'auroc': 0.5511337608795236, 'auprc': 0.606286507310604, 'f1': 0.5414551607445008, 'acc': 0.5414551607445008, 'eval_loss': 0.7267374992370605}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.4690677966101695, 'auprc': 0.4760503128279338, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6944787596401415}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5303137883646358, 'auprc': 0.5207646382789118, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6976239022455717}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.09333465847855542, 'tp': 176, 'tn': 147, 'fp': 148, 'fn': 120, 'auroc': 0.581779661016949, 'auprc': 0.5990306403283328, 'f1': 0.5465313028764806, 'acc': 0.5465313028764806, 'eval_loss': 0.7064932365166513}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.11345683978036342, 'tp': 61, 'tn': 259, 'fp': 36, 'fn': 235, 'auroc': 0.5986830050389373, 'auprc': 0.5870343184944578, 'f1': 0.5414551607445008, 'acc': 0.5414551607445008, 'eval_loss': 0.6987140868839464}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.1277106413077166, 'tp': 152, 'tn': 181, 'fp': 114, 'fn': 144, 'auroc': 0.5813559322033899, 'auprc': 0.6197220981370304, 'f1': 0.5634517766497462, 'acc': 0.5634517766497462, 'eval_loss': 0.8990962097519323}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5126431516262024, 'auprc': 0.5240095844454189, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6950931298105341}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.546358222629409, 'auprc': 0.5559186372864937, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6957067251205444}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.4845854328905177, 'auprc': 0.4939166548419759, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6941615437206469}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5025366468163079, 'auprc': 0.5127227007386015, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6947162684641386}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.4886738433348603, 'auprc': 0.4959608982979406, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6951331088417455}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.48774622079706825, 'auprc': 0.5029720585861688, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6943331172591761}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.18304338899350867, 'tp': 140, 'tn': 208, 'fp': 87, 'fn': 156, 'auroc': 0.5939990838295923, 'auprc': 0.6250851968420328, 'f1': 0.5888324873096447, 'acc': 0.5888324873096447, 'eval_loss': 0.7289221380886278}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.19299340690423902, 'tp': 143, 'tn': 208, 'fp': 87, 'fn': 153, 'auroc': 0.5893380668804398, 'auprc': 0.6180218380698885, 'f1': 0.5939086294416244, 'acc': 0.5939086294416244, 'eval_loss': 0.7098432434232611}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.11289517513642668, 'tp': 133, 'tn': 195, 'fp': 100, 'fn': 163, 'auroc': 0.5758818140174071, 'auprc': 0.6244502262214207, 'f1': 0.5549915397631133, 'acc': 0.5549915397631133, 'eval_loss': 0.8198223019901075}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.15916653193124278, 'tp': 115, 'tn': 224, 'fp': 71, 'fn': 181, 'auroc': 0.5882615666513972, 'auprc': 0.6285577910175069, 'f1': 0.5736040609137056, 'acc': 0.5736040609137056, 'eval_loss': 0.7387722165961015}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.48856504809894646, 'auprc': 0.49495749453795845, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6960202361408033}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5426820888685295, 'auprc': 0.5402123659512018, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6946801543235779}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5451213925790197, 'auprc': 0.5544147221748635, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.694665723725369}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5535043518094366, 'auprc': 0.553802575946397, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6945303678512573}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.15636103899567558, 'tp': 132, 'tn': 208, 'fp': 87, 'fn': 164, 'auroc': 0.5934493815849748, 'auprc': 0.6386916498364946, 'f1': 0.5752961082910322, 'acc': 0.5752961082910322, 'eval_loss': 0.687680278953753}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.1353788235525247, 'tp': 117, 'tn': 216, 'fp': 79, 'fn': 179, 'auroc': 0.5859024278515804, 'auprc': 0.6311936760473775, 'f1': 0.5634517766497462, 'acc': 0.5634517766497462, 'eval_loss': 0.7147401194823416}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5054054054054054, 'auprc': 0.507834305688015, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6976714228328905}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.14486613798738684, 'tp': 122, 'tn': 214, 'fp': 81, 'fn': 174, 'auroc': 0.5733279890059552, 'auprc': 0.6338591171705209, 'f1': 0.5685279187817259, 'acc': 0.5685279187817259, 'eval_loss': 0.7350959087672987}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.17484524312995162, 'tp': 25, 'tn': 292, 'fp': 3, 'fn': 271, 'auroc': 0.5763284470911589, 'auprc': 0.6183569307181249, 'f1': 0.5363790186125211, 'acc': 0.5363790186125211, 'eval_loss': 0.6907856527127718}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.545716903344022, 'auprc': 0.5596035407743263, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6980974423257928}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.5477095739807605, 'auprc': 0.5371327355809137, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6930736836634184}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 295, 'fp': 0, 'fn': 296, 'auroc': 0.558680714612918, 'auprc': 0.5329905589642072, 'f1': 0.49915397631133673, 'acc': 0.49915397631133673, 'eval_loss': 0.6952331850403234}


### 1.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [22]:
# Human-readable row labels for the aggregated results table, listed in the
# same order as the architectures appear in the rendered table below.
indexBERT = [
    'TweetBERT',
    'BERT',
    'RoBERTa',
    'DistilBERT',
    'CamemBERT',
    'Albert',
    'Flaubert',
]

# Throw away whatever index the accumulated summary rows carry and label
# each row with its model name instead (one label per row is required).
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT

# Keep an independent snapshot of this table under its own name: the next
# training cell reassigns `dfResultsModelsTotal` from scratch.
dfResultssModelsTotal1 = dfResultsModelsTotal.copy()
dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.044473,77.5,230.75,64.25,218.5,0.533074,0.550533,0.354083,0.521574,0.706333
BERT,0.060292,53.25,257.5,37.5,242.75,0.55976,0.571671,0.275372,0.525804,0.747153
RoBERTa,0.0,0.0,295.0,0.0,296.0,0.490886,0.501393,0.0,0.499154,0.694586
DistilBERT,0.162025,132.75,208.75,86.25,163.25,0.58687,0.624029,0.515534,0.577834,0.74934
CamemBERT,0.0,0.0,295.0,0.0,296.0,0.532468,0.535847,0.0,0.499154,0.694974
Albert,0.109152,92.75,233.25,61.75,203.25,0.564521,0.602895,0.411765,0.551607,0.708797
Flaubert,0.043711,6.25,294.25,0.75,289.75,0.557109,0.562021,0.041254,0.50846,0.694297


## 2. BERT Models applied to Category II - Tweets promoting Eating Disorders

In [23]:
# Category II experiment: for every transformer architecture, fine-tune and
# evaluate N_ITER independent models on one fixed 70/30 split, then average
# the evaluation metrics per architecture into `dfResultsModelsTotal`
# (one row per architecture, in the order of `c_model_1`).
#gc.collect()
#torch.cuda.empty_cache()

# Number of leading runs (per architecture) whose fitted model is pickled to
# disk; 0 disables saving.
limitsave = 0

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y2, test_size=0.3, random_state=42)
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

# simpletransformers emits "Dataframe headers not specified. Falling back to
# using column 0 as text and column 1 as labels." when the frame lacks the
# headers it looks for. Hand it explicitly named copies so the mapping is
# stated rather than positional; `train_df1` / `test_df1` keep their original
# column names for any other cell that reads them.
_st_headers = {'text_cleaned': 'text', 'target': 'labels'}
train_input1 = train_df1.rename(columns=_st_headers)
test_input1 = test_df1.rename(columns=_st_headers)

# Parallel lists: simpletransformers model type and the matching pretrained
# checkpoint name.
c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

# One averaged single-row frame per architecture.
model_summaries = []

for idx, (model, checkpoint) in enumerate(zip(c_model_1, c_model_2)):

    # One single-row metrics frame per run of this architecture. Collecting
    # them and concatenating once replaces the removed/quadratic
    # `DataFrame.append` and cannot pick up stale rows from an earlier
    # architecture or cell.
    run_frames = []

    for i in range(0, N_ITER):
        model1 = ClassificationModel(
            model, checkpoint,
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_input1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_input1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if i < limitsave:
            # NOTE(review): the file name depends only on the run number, so
            # each architecture overwrites the previous one's files.
            torch.save(model1, 'model1'+str(i)+'.pt')
        # Release the model before the next run allocates a new one.
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        run_frames.append(pd.DataFrame.from_dict(result1, orient="index").T)

    # All runs of this architecture (one row each), then their column-wise mean.
    dfResultsModels1 = pd.concat(run_frames)
    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    # Overwrite the averaged per-run 'f1' with the value `calcule_f1` derives
    # from the averaged row (presumably from the tp/fp/fn counts; helper is
    # defined in another cell).
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)

    # Rebuild the running total after every architecture so partial results
    # are available if the cell is interrupted.
    model_summaries.append(dfResultsModels1Trans)
    dfResultsModelsTotal = pd.concat(model_summaries)
    #dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-2.csv')



Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5543778801843318, 'auprc': 0.2550984037012106, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5129570317895789}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.13038221706133446, 'tp': 13, 'tn': 449, 'fp': 16, 'fn': 113, 'auroc': 0.5983273596176822, 'auprc': 0.3407823244640531, 'f1': 0.7817258883248731, 'acc': 0.7817258883248731, 'eval_loss': 0.5057991272524783}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.6018774534903567, 'auprc': 0.3273634333563661, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5125844431550879}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.6006144393241168, 'auprc': 0.33897571586831277, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5126889097063165}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.38796809248320707, 'tp': 65, 'tn': 405, 'fp': 60, 'fn': 61, 'auroc': 0.7339307048984469, 'auprc': 0.569173440278475, 'f1': 0.7952622673434857, 'acc': 0.7952622673434856, 'eval_loss': 0.5145674708642458}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.3389762097614201, 'tp': 57, 'tn': 407, 'fp': 58, 'fn': 69, 'auroc': 0.6896228025260284, 'auprc': 0.38479531711626747, 'f1': 0.7851099830795261, 'acc': 0.7851099830795262, 'eval_loss': 0.6933815479278564}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.3381018176997214, 'tp': 61, 'tn': 398, 'fp': 67, 'fn': 65, 'auroc': 0.758115719406042, 'auprc': 0.5627676803754379, 'f1': 0.7766497461928935, 'acc': 0.7766497461928934, 'eval_loss': 0.5365136108900371}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.36368249240198314, 'tp': 41, 'tn': 442, 'fp': 23, 'fn': 85, 'auroc': 0.7369346304830175, 'auprc': 0.5413769558022297, 'f1': 0.817258883248731, 'acc': 0.817258883248731, 'eval_loss': 0.45670062225115926}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5551117938214712, 'auprc': 0.2616629851026225, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5101587960594579}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.7142345110087045, 'auprc': 0.45333089737755616, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.47590334321323197}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5236473800989929, 'auprc': 0.23004929002398, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5134150527025524}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5835808158388803, 'auprc': 0.2936983571137608, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5137417536032828}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.3528053308082998, 'tp': 58, 'tn': 409, 'fp': 56, 'fn': 68, 'auroc': 0.7258576548899129, 'auprc': 0.5187762795543974, 'f1': 0.7901861252115059, 'acc': 0.7901861252115059, 'eval_loss': 0.4966221953693189}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.3633171493388823, 'tp': 56, 'tn': 416, 'fp': 49, 'fn': 70, 'auroc': 0.7403823178016727, 'auprc': 0.5687588918426976, 'f1': 0.7986463620981388, 'acc': 0.7986463620981388, 'eval_loss': 0.48132941283677755}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.2972332415957694, 'tp': 53, 'tn': 403, 'fp': 62, 'fn': 73, 'auroc': 0.7123741252773511, 'auprc': 0.5095963273218607, 'f1': 0.7715736040609137, 'acc': 0.7715736040609137, 'eval_loss': 0.5539306464948153}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.36188610705752744, 'tp': 64, 'tn': 399, 'fp': 66, 'fn': 62, 'auroc': 0.748557774364226, 'auprc': 0.5228154060894482, 'f1': 0.7834179357021996, 'acc': 0.7834179357021996, 'eval_loss': 0.46671177054706375}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.592268305171531, 'auprc': 0.2950885783492697, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5129033327102661}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.32331860539512436, 'tp': 50, 'tn': 417, 'fp': 48, 'fn': 76, 'auroc': 0.7496671786994367, 'auprc': 0.5167007440737865, 'f1': 0.7901861252115059, 'acc': 0.7901861252115059, 'eval_loss': 0.4642818609350606}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.6621607782898106, 'auprc': 0.3863264329418583, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5065067504581652}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.7065881549752517, 'auprc': 0.43963382468962253, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.4782246178702304}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5544888206178529, 'auprc': 0.25469564080974705, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5144351909035131}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.2566700892498441, 'tp': 44, 'tn': 411, 'fp': 54, 'fn': 82, 'auroc': 0.6367127496159755, 'auprc': 0.4605175967592816, 'f1': 0.7698815566835872, 'acc': 0.7698815566835872, 'eval_loss': 0.540004982760078}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': -0.023374107454834623, 'tp': 4, 'tn': 445, 'fp': 20, 'fn': 122, 'auroc': 0.5701826250213347, 'auprc': 0.25341005815456735, 'f1': 0.7597292724196277, 'acc': 0.7597292724196277, 'eval_loss': 0.5336133398507771}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.34519713640964944, 'tp': 40, 'tn': 440, 'fp': 25, 'fn': 86, 'auroc': 0.6818569721795528, 'auprc': 0.5159524135130096, 'f1': 0.8121827411167513, 'acc': 0.8121827411167513, 'eval_loss': 0.48594962609441655}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5707799965864483, 'auprc': 0.2953070077952138, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5123659074306488}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.4983358934971838, 'auprc': 0.20221405280845967, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5134178149072748}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 465, 'fp': 0, 'fn': 126, 'auroc': 0.5874722648916197, 'auprc': 0.31642131554494096, 'f1': 0.7868020304568529, 'acc': 0.7868020304568528, 'eval_loss': 0.5135041992915305}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.40587492377345546, 'tp': 38, 'tn': 453, 'fp': 12, 'fn': 88, 'auroc': 0.6968766001024065, 'auprc': 0.5459891507017433, 'f1': 0.8307952622673436, 'acc': 0.8307952622673435, 'eval_loss': 0.43545809074452047}


### 2.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [24]:
# Row labels for the summary table. The order must match the order in which
# the per-model rows were accumulated in `dfResultsModelsTotal`.
indexBERT = [
    'TweetBERT',
    'BERT',
    'RoBERTa',
    'DistilBERT',
    'CamemBERT',
    'Albert',
    'Flaubert',
]

# Discard the repeated index left over from accumulating one row per model,
# then label every row with the corresponding model name.
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT

# Keep an independent snapshot of this section's results; the name
# `dfResultsModelsTotal` is reassigned by the next experiment.
dfResultssModelsTotal1 = dfResultsModelsTotal.copy()

dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.032596,3.25,461.0,4.0,122.75,0.588799,0.315555,0.04878,0.785533,0.511007
BERT,0.357182,56.0,413.0,52.0,70.0,0.729651,0.514528,0.478632,0.79357,0.550291
RoBERTa,0.0,0.0,465.0,0.0,126.0,0.594144,0.309685,0.0,0.786802,0.503305
DistilBERT,0.34381,57.75,406.75,58.25,68.25,0.731793,0.529987,0.477273,0.785956,0.499649
CamemBERT,0.08083,12.5,453.0,12.0,113.5,0.677671,0.409437,0.166113,0.787648,0.490479
Albert,0.144623,22.0,440.25,24.75,104.0,0.61081,0.371144,0.254703,0.782149,0.518501
Flaubert,0.101469,9.5,462.0,3.0,116.5,0.588366,0.339983,0.137184,0.7978,0.493687


## 3. BERT Models applied to Category III - Informative tweets

In [25]:
# Category III (informative tweets): fine-tune every transformer N_ITER times
# on the same 70/30 train/test split and average the evaluation metrics per model.

# Number of runs per model whose fine-tuned model object is written to disk
# (0 disables saving).
limitsave = 0

X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y3, test_size=0.3, random_state=42)
# simpletransformers does not recognise these headers and reports that it falls
# back to "column 0 as text and column 1 as labels", so the column order below
# (text first, label second) must be preserved.
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

# Parallel lists: simpletransformers model type and the matching pretrained checkpoint.
c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

# One averaged single-row frame per model, in training order.
model_summaries = []

for model_type, model_name in zip(c_model_1, c_model_2):

    # One single-row frame of evaluation metrics per run of the current model.
    # Collected in a list and concatenated once instead of growing a frame
    # with the removed `DataFrame.append`.
    run_frames = []

    for i in range(0, N_ITER):
        model1 = ClassificationModel(
            model_type, model_name,
            use_cuda=True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if i < limitsave:
            # NOTE(review): the file name only encodes the run number, so each
            # model type overwrites the file written by the previous one.
            torch.save(model1, 'model1'+str(i)+'.pt')
        # Release the model before the next run so GPU memory does not accumulate.
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        run_frames.append(pd.DataFrame.from_dict(result1, orient="index").T)

    # Raises ValueError when N_ITER is 0 rather than silently reusing results
    # left over from a previous section.
    dfResultsModels1 = pd.concat(run_frames)

    # Average every metric over the runs of this model (one row per model).
    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    # Overwrite the averaged 'f1' column with the value calcule_f1 derives from
    # the averaged row (presumably from the averaged tp/fp/fn counts; confirm
    # against its definition earlier in the notebook).
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)

    # Rebuild the running summary after every model so partial results remain
    # available if the cell is interrupted.
    model_summaries.append(dfResultsModels1Trans)
    dfResultsModelsTotal = pd.concat(model_summaries)
    #dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-3.csv')



Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5168957685871385, 'auprc': 0.4070739100943132, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.674005317060571}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.02142592055201, 'tp': 70, 'tn': 257, 'fp': 99, 'fn': 165, 'auroc': 0.5347298589529046, 'auprc': 0.41495389727995147, 'f1': 0.5532994923857868, 'acc': 0.5532994923857868, 'eval_loss': 0.7136261180827492}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5233564427444418, 'auprc': 0.4221982879503171, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6737947024797138}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': -0.05803378500312194, 'tp': 0, 'tn': 353, 'fp': 3, 'fn': 235, 'auroc': 0.5028986373416209, 'auprc': 0.41921013256242057, 'f1': 0.5972927241962775, 'acc': 0.5972927241962775, 'eval_loss': 0.6785668354285391}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5487628496294525, 'auprc': 0.4223764457182487, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6720413000960099}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.4689875687305761, 'auprc': 0.3674221872084402, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6727089474075719}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.03637909377433385, 'tp': 101, 'tn': 216, 'fp': 140, 'fn': 134, 'auroc': 0.5174934257709778, 'auprc': 0.41619610746357355, 'f1': 0.5363790186125211, 'acc': 0.5363790186125211, 'eval_loss': 1.0456180101946781}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5176129572077457, 'auprc': 0.41371817235102204, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6730827689170837}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5270260578532153, 'auprc': 0.4236826287529917, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6727114445284793}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.4995218742529285, 'auprc': 0.4065272394530621, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6729014170797247}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.4980217547214918, 'auprc': 0.401493041181477, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6723020641427291}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.49414893617021277, 'auprc': 0.3944820605761771, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6723609127496418}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.045490681167879084, 'tp': 76, 'tn': 256, 'fp': 100, 'fn': 159, 'auroc': 0.5748565622758786, 'auprc': 0.44900467508453634, 'f1': 0.5617597292724196, 'acc': 0.5617597292724196, 'eval_loss': 0.7094366832783348}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.06298183357945353, 'tp': 91, 'tn': 240, 'fp': 116, 'fn': 144, 'auroc': 0.5748685154195554, 'auprc': 0.4460805381356833, 'f1': 0.560067681895093, 'acc': 0.560067681895093, 'eval_loss': 0.8086670825355932}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0804123803378336, 'tp': 86, 'tn': 253, 'fp': 103, 'fn': 149, 'auroc': 0.5535680133875209, 'auprc': 0.44496227122099774, 'f1': 0.5736040609137056, 'acc': 0.5736040609137056, 'eval_loss': 0.8003021415911222}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': -0.047685608864788044, 'tp': 73, 'tn': 229, 'fp': 127, 'fn': 162, 'auroc': 0.496324408319388, 'auprc': 0.3970928040138184, 'f1': 0.5109983079526227, 'acc': 0.5109983079526227, 'eval_loss': 0.7449788953128614}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.515007171886206, 'auprc': 0.4124840959163123, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6742075242494282}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.490796079368874, 'auprc': 0.4009189672914335, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6740003604637949}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5262670332297394, 'auprc': 0.4244267233473355, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6728018083070454}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.4955594071240736, 'auprc': 0.4019851694587304, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6743251273506566}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.10646565397812174, 'tp': 79, 'tn': 271, 'fp': 85, 'fn': 156, 'auroc': 0.5816339947406167, 'auprc': 0.471954589614862, 'f1': 0.5922165820642978, 'acc': 0.5922165820642978, 'eval_loss': 0.6945458054542542}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.08986904045445607, 'tp': 91, 'tn': 249, 'fp': 107, 'fn': 144, 'auroc': 0.5822316519244561, 'auprc': 0.4868453540993001, 'f1': 0.5752961082910322, 'acc': 0.5752961082910322, 'eval_loss': 0.6790556813541212}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.09214909236569599, 'tp': 102, 'tn': 234, 'fp': 122, 'fn': 133, 'auroc': 0.5789803968443701, 'auprc': 0.4905263997186331, 'f1': 0.5685279187817259, 'acc': 0.5685279187817259, 'eval_loss': 0.6996626697088543}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.060392533440468694, 'tp': 56, 'tn': 289, 'fp': 67, 'fn': 179, 'auroc': 0.5699438202247191, 'auprc': 0.4434114321001835, 'f1': 0.583756345177665, 'acc': 0.583756345177665, 'eval_loss': 0.671184097465716}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.4876703322973942, 'auprc': 0.40904671983370056, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6736677351750826}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.5151267033229739, 'auprc': 0.4159176994143494, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6722918686113859}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.530223523786756, 'auprc': 0.4275098869188965, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.672579332401878}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 356, 'fp': 0, 'fn': 235, 'auroc': 0.4615467367917762, 'auprc': 0.378635343425892, 'f1': 0.6023688663282571, 'acc': 0.6023688663282571, 'eval_loss': 0.6739688139212759}


### 3.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [26]:
# Display labels for the averaged per-model rows. The order must match the
# order in which the models were trained (c_model_1 in the training cell).
indexBERT = [
    'TweetBERT',
    'BERT',
    'RoBERTa',
    'DistilBERT',
    'CamemBERT',
    'Albert',
    'Flaubert',
]

# Throw away the index left over from accumulating the rows, then label each
# row with its model name (raises if the row count differs from the labels).
dfResultsModelsTotal = dfResultsModelsTotal.reset_index(drop=True)
dfResultsModelsTotal.index = indexBERT

# Independent snapshot of this section's results; the next training cell
# reassigns dfResultsModelsTotal.
dfResultssModelsTotal1 = dfResultsModelsTotal.copy()
dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,-0.009152,17.5,330.5,25.5,217.5,0.51947,0.415859,0.125899,0.588832,0.684998
BERT,0.009095,25.25,321.0,35.0,209.75,0.513214,0.404928,0.171041,0.585871,0.765863
RoBERTa,0.0,0.0,356.0,0.0,235.0,0.50468,0.406546,0.0,0.602369,0.672569
DistilBERT,0.0353,81.5,244.5,111.5,153.5,0.549904,0.434285,0.380841,0.551607,0.765846
CamemBERT,0.0,0.0,356.0,0.0,235.0,0.506907,0.409954,0.0,0.602369,0.673834
Albert,0.087219,82.0,260.75,95.25,153.0,0.578197,0.473184,0.397817,0.579949,0.686112
Flaubert,0.0,0.0,356.0,0.0,235.0,0.498642,0.407777,0.0,0.602369,0.673127


## 4. BERT Models applied to Category IV - Scientific Tweets

In [27]:
# Category IV: fine-tune every transformer N_ITER times on the same split and
# average the evaluation metrics per model into dfResultsModelsTotal.

# Runs with index i < limitsave have their fitted model pickled to disk
# (0 disables saving).
limitsave=0

# Hold out 30% of the samples for evaluation; random_state pins the split.
X1_train, X1_test, y1_train, y1_test = train_test_split(X, Y4, test_size=0.3, random_state=42)
# NOTE: these column names are not the ones simpletransformers looks for, so it
# logs "Dataframe headers not specified" and falls back to column 0 as text and
# column 1 as labels. Keep the text column first and the label column second.
train_df1 = pd.DataFrame({ 'text_cleaned': X1_train, 'target': y1_train })
test_df1 = pd.DataFrame({ 'text_cleaned': X1_test, 'target': y1_test })

# Parallel lists: model type (c_model_1) and the pretrained checkpoint to load
# for it (c_model_2).
c_model_1 = ["bertweet","bert","roberta", "distilbert","camembert",  "albert", "flaubert"]
c_model_2 = ["vinai/bertweet-base","bert-base-multilingual-cased","roberta-base","distilbert-base-cased", "camembert-base", "albert-base-v1", "flaubert/flaubert_base_cased"]

# One averaged-metrics row per model, in training order.
model_mean_frames = []

for idx, (model_type, model_name) in enumerate(zip(c_model_1, c_model_2)):

    # One single-row metrics frame per run of the current model.
    run_frames = []

    for i in range(0,N_ITER):
        # A fresh model per run so no weights carry over between runs.
        model1 = ClassificationModel(
            model_type, model_name,
            use_cuda = True,
            args=train_args
        )
        model1.train_model(train_df1)
        result1, model_outputs1, wrong_predictions1 = model1.eval_model(test_df1, f1=f1_multiclass, acc=accuracy_score)
        print(result1)
        if(i<limitsave):
            # NOTE: the file name depends only on the run index, so with
            # limitsave > 0 each model type overwrites the previous one's files.
            torch.save(model1, 'model1'+str(i)+'.pt')
        # Release the model and cached GPU memory before the next run.
        del model1
        gc.collect()
        torch.cuda.empty_cache()
        run_frames.append(pd.DataFrame.from_dict(result1, orient="index").T)

    # Single concat instead of repeated DataFrame.append (removed in pandas 2.0);
    # raises if N_ITER is 0 rather than reusing a stale frame.
    dfResultsModels1 = pd.concat(run_frames)

    # Mean of every metric over the runs, as a one-row frame.
    dfResultsModels1Trans = pd.DataFrame(dfResultsModels1.mean(axis=0)).T
    # Replace the averaged per-run 'f1' (equal to 'acc' in the logged runs) with
    # the value calcule_f1 derives from the averaged row.
    dfResultsModels1Trans['f1'] = calcule_f1(dfResultsModels1Trans)

    # Rebuild the summary after each model so partial results survive an
    # interrupted run.
    model_mean_frames.append(dfResultsModels1Trans)
    dfResultsModelsTotal = pd.concat(model_mean_frames)
    #dfResultsModelsTotal.to_csv('dfResultsModelsTotalEMB-4.csv')



Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

  "Dataframe headers not specified. Falling back to using column 0 as text and column 1 as labels."


Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

  mcc = cov_ytyp / np.sqrt(cov_ytyt * cov_ypyp)


{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.48073494011709117, 'auprc': 0.2756174984331953, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5715288363004986}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5067758328627894, 'auprc': 0.2685313062191896, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5718403129201186}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.07313760305412682, 'tp': 18, 'tn': 406, 'fp': 31, 'fn': 136, 'auroc': 0.5120063003358197, 'auprc': 0.3106414430240656, 'f1': 0.7174280879864636, 'acc': 0.7174280879864636, 'eval_loss': 0.6109400109240883}


Some weights of the model checkpoint at vinai/bertweet-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight', 'lm_head.decoder.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at vinai/bertweet-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classi

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5251270468661773, 'auprc': 0.2789034958616555, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5764450242644862}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.029083299634093902, 'tp': 37, 'tn': 344, 'fp': 93, 'fn': 117, 'auroc': 0.5339088828791346, 'auprc': 0.2792932101553465, 'f1': 0.6446700507614214, 'acc': 0.6446700507614214, 'eval_loss': 0.7621623512945677}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5116496775535677, 'auprc': 0.26688311115626673, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5708083918220118}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5574459865077714, 'auprc': 0.3057264573078326, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5707062388721266}


Some weights of the model checkpoint at bert-base-multilingual-cased were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model ch

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5156171060061221, 'auprc': 0.2721291812872042, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5712041258811951}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5174893756129455, 'auprc': 0.27708189255955973, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5721192485407779}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5175488127433208, 'auprc': 0.26729581051749807, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5731330341414401}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.4798656720853517, 'auprc': 0.2606518851150452, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5725217053764745}


Some weights of the model checkpoint at roberta-base were not used when initializing RobertaForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at roberta-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'classifier.out

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5409373235460192, 'auprc': 0.28286604119749015, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5717626559106928}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.6224999257035871, 'auprc': 0.3343314904188596, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5549519971797341}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5861244019138756, 'auprc': 0.3036527032288342, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5820571184158325}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.04506939304410541, 'tp': 24, 'tn': 384, 'fp': 53, 'fn': 130, 'auroc': 0.5860501055009064, 'auprc': 0.3160623297739104, 'f1': 0.6903553299492385, 'acc': 0.6903553299492385, 'eval_loss': 0.6076277243463617}


Some weights of the model checkpoint at distilbert-base-cased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.weight', 'vocab_transform.bias', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight', 'vocab_projector.bias']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-cased and are newly initialized: ['pre_classifier.weight', 'pre_classifier.bias', 'classifier

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.11856848755748416, 'tp': 32, 'tn': 387, 'fp': 50, 'fn': 122, 'auroc': 0.6122767392790276, 'auprc': 0.33298676678922634, 'f1': 0.7089678510998308, 'acc': 0.7089678510998308, 'eval_loss': 0.6416943716375452}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.4997176736307172, 'auprc': 0.257158032346754, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5722068516831649}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5084846503610806, 'auprc': 0.28215236714078584, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5722316974087766}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5430770602395316, 'auprc': 0.300097113889132, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5712308460160306}


Some weights of the model checkpoint at camembert-base were not used when initializing CamembertForSequenceClassification: ['lm_head.bias', 'lm_head.dense.weight', 'lm_head.dense.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.decoder.weight']
- This IS expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing CamembertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of CamembertForSequenceClassification were not initialized from the model checkpoint at camembert-base and are newly initialized: ['classifier.dense.weight', 'classifier.dense.bias', 'classifier.out_proj.weight', 'cl

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5229427323248833, 'auprc': 0.2849666542736885, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5718340685493067}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.06848134435779686, 'tp': 21, 'tn': 398, 'fp': 39, 'fn': 133, 'auroc': 0.586718773217629, 'auprc': 0.3121921869820265, 'f1': 0.7089678510998308, 'acc': 0.7089678510998308, 'eval_loss': 0.6091894209384918}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5038188356266159, 'auprc': 0.25229311822844, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5757948301340404}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5147255490504918, 'auprc': 0.2603542197341739, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5725362222445639}


Some weights of the model checkpoint at albert-base-v1 were not used when initializing AlbertForSequenceClassification: ['predictions.bias', 'predictions.LayerNorm.weight', 'predictions.LayerNorm.bias', 'predictions.dense.weight', 'predictions.dense.bias', 'predictions.decoder.weight', 'predictions.decoder.bias']
- This IS expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing AlbertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of AlbertForSequenceClassification were not initialized from the model checkpoint at albert-base-v1 and are newly initialized: ['classifier.weight', 'classifier.bias']
You sho

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5707450444292549, 'auprc': 0.296074055656997, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5631361697849474}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5156022467235282, 'auprc': 0.29034836070318437, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5711114924204977}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5103866385330916, 'auprc': 0.2828981072013028, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5715928422777277}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.5323560878480786, 'auprc': 0.2749985388670983, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5724437974001232}


Some weights of the model checkpoint at flaubert/flaubert_base_cased were not used when initializing FlaubertForSequenceClassification: ['pred_layer.proj.bias', 'pred_layer.proj.weight']
- This IS expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing FlaubertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of FlaubertForSequenceClassification were not initialized from the model checkpoint at flaubert/flaubert_base_cased and are newly initialized: ['position_embeddings.weight', 'embeddings.weight', 'layer_norm_emb.weight', 'layer_norm_emb.bias', 'attentions.0.q_lin.weight', 'attentions.0.q_lin.bias', 

  0%|          | 0/3 [00:00<?, ?it/s]

Epoch:   0%|          | 0/15 [00:00<?, ?it/s]

Running Epoch 0 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 1 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 2 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 3 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 4 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 5 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 6 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 7 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 8 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 9 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 10 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 11 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 12 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 13 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Epoch 14 of 15:   0%|          | 0/44 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/19 [00:00<?, ?it/s]

{'mcc': 0.0, 'tp': 0, 'tn': 437, 'fp': 0, 'fn': 154, 'auroc': 0.4602291301375969, 'auprc': 0.23721036313858068, 'f1': 0.739424703891709, 'acc': 0.739424703891709, 'eval_loss': 0.5721141633234526}


### 4.1. Results using original dataset (texts) + embeddings obtained from knowledge graph exploitation

In [28]:
# Model names used as row labels for the results table.
# NOTE(review): the labels are applied purely by position, so this presumes the
# rows of dfResultsModelsTotal already follow this model order — confirm
# against the cell that builds the frame.
indexBERT = [
    'TweetBERT',
    'BERT',
    'RoBERTa',
    'DistilBERT',
    'CamemBERT',
    'Albert',
    'Flaubert',
]

# Drop whatever index the frame currently carries and label the rows with the
# model names instead (raises if the row count differs from len(indexBERT)).
dfResultsModelsTotal = (
    dfResultsModelsTotal
    .reset_index(drop=True)
    .set_axis(indexBERT, axis=0)
)

# Keep an independent snapshot of the labelled table and display it.
dfResultssModelsTotal1 = dfResultsModelsTotal.copy()
dfResultssModelsTotal1

Unnamed: 0,mcc,tp,tn,fp,fn,auroc,auprc,f1,acc,eval_loss
TweetBERT,0.018284,4.5,429.25,7.75,149.5,0.506161,0.283423,0.054135,0.733926,0.582689
BERT,0.007271,9.25,413.75,23.25,144.75,0.529655,0.281008,0.099196,0.715736,0.61872
RoBERTa,0.0,0.0,437.0,0.0,154.0,0.51396,0.271974,0.0,0.739425,0.572384
DistilBERT,0.040909,14.0,411.25,25.75,140.0,0.601738,0.321758,0.144516,0.719543,0.596583
CamemBERT,0.0,0.0,437.0,0.0,154.0,0.518556,0.281094,0.0,0.739425,0.571876
Albert,0.01712,5.25,427.25,9.75,148.75,0.544002,0.280228,0.06213,0.73181,0.580164
Flaubert,0.0,0.0,437.0,0.0,154.0,0.504644,0.271364,0.0,0.739425,0.571816
