In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score, precision_score, recall_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
import torch
import torch.nn as nn
from transformers import AutoModel, TrainingArguments, Trainer, BertModel
from transformers.modeling_outputs import SequenceClassifierOutput
import numpy as np
from sklearn.metrics import confusion_matrix, ConfusionMatrixDisplay
import matplotlib.pyplot as plt
import seaborn as sns
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'results'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,Precision,Recall,F1\n')


df = pd.read_csv('Expectation_Analysis.csv', encoding='utf-8', engine='python', sep='\t')



df.fillna('', inplace=True)  
display(len(df))


display(df.columns)
display(len(df))
display(df[:4])



classes = set(df['future_sentiment'].values)
display(classes)

c = df['future_sentiment'].value_counts()
display(c)

df['future_sentiment'] = df['future_sentiment'].astype('category')
df['label'] = df['future_sentiment'].cat.codes

df = df[['text', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02',
        'asafaya/bert-base-arabic',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/ARBERTv2',
        'UBC-NLP/MARBERTv2',
        'faisalq/SaudiBERT',           
]


seeds = [0, 1, 42, 100]


for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
          
            tokenizer = AutoTokenizer.from_pretrained(model_name)                
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True) 
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)  
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')  
                precision = precision_score(labels, predictions, average='macro')
                recall = recall_score(labels, predictions, average='macro')
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{precision},{recall},{f1}\n')
                return {'accuracy': acc, 'precision': precision, 'recall':recall, 'f1_score': f1}
    
    
            
            
            epochs = 8
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 50, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 50
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'Precision', 'Recall', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2025-02-10 14:19:48.250489: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2025-02-10 14:19:48.412371: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


16152

Index(['text', 'future_sentiment', 'class'], dtype='object')

16152

Unnamed: 0,text,future_sentiment,class
0,إن شاء الله خسارة للمتغطرس مدرب اليونايتد,pessimistic,sport
1,إن شاء الله عمان تغادر البطولة,optimistic,sport
2,اتمنى استغلال السمعة الاوروبية عن فيغا وتصريفه سريع في الشتوية,optimistic,sport
3,اتوقع انهيار الخصم الان,pessimistic,sport


{'neutral', 'optimistic', 'pessimistic'}

future_sentiment
optimistic     6611
neutral        5472
pessimistic    4069
Name: count, dtype: int64

3

16152

DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

aubmindlab/bert-base-arabertv02, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8053,0.577394,0.755494,0.748023,0.758492,0.747632
100,0.6061,0.504984,0.782111,0.777925,0.781211,0.778095
150,0.5102,0.446429,0.815846,0.811261,0.809046,0.807571
200,0.5013,0.459223,0.809966,0.808328,0.809303,0.800363
250,0.3224,0.432357,0.838131,0.831572,0.834028,0.832705
300,0.3016,0.460409,0.828536,0.825638,0.819751,0.822025
350,0.305,0.409012,0.836583,0.831797,0.831284,0.831341
400,0.3103,0.407111,0.842464,0.837503,0.835374,0.835835
450,0.1428,0.522246,0.835345,0.829362,0.830343,0.82894
500,0.149,0.472958,0.848654,0.843652,0.842421,0.843014


aubmindlab/bert-base-arabertv02, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8226,0.630034,0.738781,0.741186,0.741541,0.721782
100,0.5949,0.505979,0.790777,0.783986,0.787272,0.785281
150,0.5215,0.461654,0.808728,0.802035,0.804345,0.800665
200,0.5064,0.457863,0.809347,0.80574,0.800856,0.800728
250,0.34,0.471251,0.818013,0.816453,0.817108,0.814827
300,0.306,0.476548,0.822656,0.817826,0.813718,0.815495
350,0.2885,0.572492,0.793253,0.803497,0.789658,0.780129
400,0.3153,0.440004,0.831012,0.822986,0.831017,0.824874
450,0.1623,0.546213,0.82637,0.828408,0.818562,0.821254
500,0.1642,0.535838,0.83225,0.828038,0.823479,0.824317


aubmindlab/bert-base-arabertv02, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8226,0.630034,0.738781,0.741186,0.741541,0.721782
100,0.5949,0.505979,0.790777,0.783986,0.787272,0.785281
150,0.5215,0.461654,0.808728,0.802035,0.804345,0.800665
200,0.5064,0.457863,0.809347,0.80574,0.800856,0.800728
250,0.34,0.471251,0.818013,0.816453,0.817108,0.814827
300,0.306,0.476548,0.822656,0.817826,0.813718,0.815495
350,0.2885,0.572492,0.793253,0.803497,0.789658,0.780129
400,0.3153,0.440004,0.831012,0.822986,0.831017,0.824874
450,0.1623,0.546213,0.82637,0.828408,0.818562,0.821254
500,0.1642,0.535838,0.83225,0.828038,0.823479,0.824317


aubmindlab/bert-base-arabertv02, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8287,0.65074,0.717734,0.734393,0.726086,0.694873
100,0.5992,0.522823,0.788301,0.78825,0.778693,0.779783
150,0.5284,0.465956,0.805633,0.805961,0.793108,0.797511
200,0.4841,0.445919,0.82637,0.828848,0.813682,0.818293
250,0.3504,0.524354,0.789539,0.79628,0.787851,0.778462
300,0.3145,0.427372,0.831631,0.829234,0.822221,0.82509
350,0.2992,0.45354,0.827298,0.820622,0.82841,0.822457
400,0.3138,0.418846,0.829774,0.824138,0.826798,0.824906
450,0.1458,0.529216,0.840607,0.833715,0.835292,0.83441
500,0.1504,0.46209,0.830703,0.822872,0.827763,0.824663


aubmindlab/bert-base-arabertv02, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8287,0.65074,0.717734,0.734393,0.726086,0.694873
100,0.5992,0.522823,0.788301,0.78825,0.778693,0.779783
150,0.5284,0.465956,0.805633,0.805961,0.793108,0.797511
200,0.4841,0.445919,0.82637,0.828848,0.813682,0.818293
250,0.3504,0.524354,0.789539,0.79628,0.787851,0.778462
300,0.3145,0.427372,0.831631,0.829234,0.822221,0.82509
350,0.2992,0.45354,0.827298,0.820622,0.82841,0.822457
400,0.3138,0.418846,0.829774,0.824138,0.826798,0.824906
450,0.1458,0.529216,0.840607,0.833715,0.835292,0.83441
500,0.1504,0.46209,0.830703,0.822872,0.827763,0.824663


aubmindlab/bert-base-arabertv02, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8287,0.65074,0.717734,0.734393,0.726086,0.694873
100,0.5992,0.522823,0.788301,0.78825,0.778693,0.779783
150,0.5284,0.465956,0.805633,0.805961,0.793108,0.797511
200,0.4841,0.445919,0.82637,0.828848,0.813682,0.818293
250,0.3504,0.524354,0.789539,0.79628,0.787851,0.778462
300,0.3145,0.427372,0.831631,0.829234,0.822221,0.82509
350,0.2992,0.45354,0.827298,0.820622,0.82841,0.822457
400,0.3138,0.418846,0.829774,0.824138,0.826798,0.824906
450,0.1458,0.529216,0.840607,0.833715,0.835292,0.83441
500,0.1504,0.46209,0.830703,0.822872,0.827763,0.824663


aubmindlab/bert-base-arabertv02, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.836,0.585729,0.756422,0.753875,0.753074,0.751161
100,0.5992,0.543169,0.772516,0.779169,0.747405,0.754611
150,0.5365,0.477106,0.804704,0.799115,0.80033,0.796475
200,0.4986,0.434769,0.815846,0.811442,0.805559,0.80784
250,0.3199,0.461252,0.816465,0.811358,0.812293,0.811248
300,0.3319,0.439458,0.827917,0.820088,0.819337,0.819053
350,0.3158,0.426653,0.831631,0.824009,0.825057,0.82451
400,0.3103,0.470209,0.822346,0.819139,0.811823,0.812877
450,0.1734,0.539317,0.818323,0.819993,0.815593,0.81485
500,0.172,0.491793,0.830084,0.823044,0.831777,0.825433


aubmindlab/bert-base-arabertv02, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.836,0.585729,0.756422,0.753875,0.753074,0.751161
100,0.5992,0.543169,0.772516,0.779169,0.747405,0.754611
150,0.5365,0.477106,0.804704,0.799115,0.80033,0.796475
200,0.4986,0.434769,0.815846,0.811442,0.805559,0.80784
250,0.3199,0.461252,0.816465,0.811358,0.812293,0.811248
300,0.3319,0.439458,0.827917,0.820088,0.819337,0.819053
350,0.3158,0.426653,0.831631,0.824009,0.825057,0.82451
400,0.3103,0.470209,0.822346,0.819139,0.811823,0.812877
450,0.1734,0.539317,0.818323,0.819993,0.815593,0.81485
500,0.172,0.491793,0.830084,0.823044,0.831777,0.825433


aubmindlab/bert-base-arabertv02, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.836,0.585729,0.756422,0.753875,0.753074,0.751161
100,0.5992,0.543169,0.772516,0.779169,0.747405,0.754611
150,0.5365,0.477106,0.804704,0.799115,0.80033,0.796475
200,0.4986,0.434769,0.815846,0.811442,0.805559,0.80784
250,0.3199,0.461252,0.816465,0.811358,0.812293,0.811248
300,0.3319,0.439458,0.827917,0.820088,0.819337,0.819053
350,0.3158,0.426653,0.831631,0.824009,0.825057,0.82451
400,0.3103,0.470209,0.822346,0.819139,0.811823,0.812877
450,0.1734,0.539317,0.818323,0.819993,0.815593,0.81485
500,0.172,0.491793,0.830084,0.823044,0.831777,0.825433


aubmindlab/bert-base-arabertv02, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8871,0.620287,0.744352,0.731244,0.735987,0.733174
100,0.6465,0.556759,0.768493,0.77677,0.766054,0.764907
150,0.5231,0.45876,0.819251,0.810788,0.809329,0.810017
200,0.5077,0.441382,0.818013,0.809295,0.809816,0.809477
250,0.3452,0.447314,0.82018,0.812829,0.819679,0.814797
300,0.3592,0.454066,0.827298,0.831816,0.807066,0.814685
350,0.3445,0.440089,0.831322,0.822151,0.823182,0.821913
400,0.3289,0.400138,0.840607,0.83272,0.831841,0.832272
450,0.1744,0.525929,0.833179,0.832687,0.814475,0.821221
500,0.1798,0.543207,0.829465,0.825444,0.825556,0.819126


aubmindlab/bert-base-arabertv02, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8871,0.620287,0.744352,0.731244,0.735987,0.733174
100,0.6465,0.556759,0.768493,0.77677,0.766054,0.764907
150,0.5231,0.45876,0.819251,0.810788,0.809329,0.810017
200,0.5077,0.441382,0.818013,0.809295,0.809816,0.809477
250,0.3452,0.447314,0.82018,0.812829,0.819679,0.814797
300,0.3592,0.454066,0.827298,0.831816,0.807066,0.814685
350,0.3445,0.440089,0.831322,0.822151,0.823182,0.821913
400,0.3289,0.400138,0.840607,0.83272,0.831841,0.832272
450,0.1744,0.525929,0.833179,0.832687,0.814475,0.821221
500,0.1798,0.543207,0.829465,0.825444,0.825556,0.819126


aubmindlab/bert-base-arabertv02, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8871,0.620287,0.744352,0.731244,0.735987,0.733174
100,0.6465,0.556759,0.768493,0.77677,0.766054,0.764907
150,0.5231,0.45876,0.819251,0.810788,0.809329,0.810017
200,0.5077,0.441382,0.818013,0.809295,0.809816,0.809477
250,0.3452,0.447314,0.82018,0.812829,0.819679,0.814797
300,0.3592,0.454066,0.827298,0.831816,0.807066,0.814685
350,0.3445,0.440089,0.831322,0.822151,0.823182,0.821913
400,0.3289,0.400138,0.840607,0.83272,0.831841,0.832272
450,0.1744,0.525929,0.833179,0.832687,0.814475,0.821221
500,0.1798,0.543207,0.829465,0.825444,0.825556,0.819126


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

asafaya/bert-base-arabic, try:0


tokenizer_config.json:   0%|          | 0.00/62.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/491 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/334k [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/445M [00:00<?, ?B/s]

Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8504,0.71092,0.696069,0.70425,0.707323,0.691045
100,0.6841,0.616866,0.748994,0.750375,0.741132,0.741153
150,0.6077,0.555866,0.765707,0.758997,0.754075,0.755987
200,0.5845,0.553627,0.768493,0.76493,0.766904,0.757116
250,0.3355,0.588098,0.772826,0.780187,0.756332,0.761142
300,0.3092,0.611034,0.782111,0.787119,0.761535,0.768142
350,0.3078,0.609113,0.784277,0.78008,0.776356,0.77404
400,0.3197,0.556253,0.798514,0.795177,0.798799,0.794438
450,0.1378,0.729328,0.792943,0.786514,0.792946,0.787768
500,0.1383,0.661039,0.792943,0.794733,0.784688,0.786881


asafaya/bert-base-arabic, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8504,0.71092,0.696069,0.70425,0.707323,0.691045
100,0.6841,0.616866,0.748994,0.750375,0.741132,0.741153
150,0.6077,0.555866,0.765707,0.758997,0.754075,0.755987
200,0.5845,0.553627,0.768493,0.76493,0.766904,0.757116
250,0.3355,0.588098,0.772826,0.780187,0.756332,0.761142
300,0.3092,0.611034,0.782111,0.787119,0.761535,0.768142
350,0.3078,0.609113,0.784277,0.78008,0.776356,0.77404
400,0.3197,0.556253,0.798514,0.795177,0.798799,0.794438
450,0.1378,0.729328,0.792943,0.786514,0.792946,0.787768
500,0.1383,0.661039,0.792943,0.794733,0.784688,0.786881


asafaya/bert-base-arabic, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8504,0.71092,0.696069,0.70425,0.707323,0.691045
100,0.6841,0.616866,0.748994,0.750375,0.741132,0.741153
150,0.6077,0.555866,0.765707,0.758997,0.754075,0.755987
200,0.5845,0.553627,0.768493,0.76493,0.766904,0.757116
250,0.3355,0.588098,0.772826,0.780187,0.756332,0.761142
300,0.3092,0.611034,0.782111,0.787119,0.761535,0.768142
350,0.3078,0.609113,0.784277,0.78008,0.776356,0.77404
400,0.3197,0.556253,0.798514,0.795177,0.798799,0.794438
450,0.1378,0.729328,0.792943,0.786514,0.792946,0.787768
500,0.1383,0.661039,0.792943,0.794733,0.784688,0.786881


asafaya/bert-base-arabic, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8554,0.760414,0.678118,0.702143,0.670415,0.64823
100,0.6581,0.608182,0.744661,0.736705,0.743354,0.73516
150,0.6078,0.552097,0.769731,0.763153,0.755551,0.758535
200,0.5788,0.549172,0.754875,0.775099,0.735672,0.740754
250,0.3557,0.647627,0.743733,0.757886,0.747712,0.727463
300,0.3292,0.536432,0.786134,0.778283,0.787182,0.779697
350,0.324,0.524715,0.792015,0.784324,0.787997,0.785684
400,0.3114,0.548869,0.791396,0.787492,0.791385,0.787071
450,0.1306,0.702756,0.795419,0.786467,0.785825,0.786097
500,0.1177,0.790532,0.774992,0.771973,0.768695,0.764805


asafaya/bert-base-arabic, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8554,0.760414,0.678118,0.702143,0.670415,0.64823
100,0.6581,0.608182,0.744661,0.736705,0.743354,0.73516
150,0.6078,0.552097,0.769731,0.763153,0.755551,0.758535
200,0.5788,0.549172,0.754875,0.775099,0.735672,0.740754
250,0.3557,0.647627,0.743733,0.757886,0.747712,0.727463
300,0.3292,0.536432,0.786134,0.778283,0.787182,0.779697
350,0.324,0.524715,0.792015,0.784324,0.787997,0.785684
400,0.3114,0.548869,0.791396,0.787492,0.791385,0.787071
450,0.1306,0.702756,0.795419,0.786467,0.785825,0.786097
500,0.1177,0.790532,0.774992,0.771973,0.768695,0.764805


asafaya/bert-base-arabic, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8554,0.760414,0.678118,0.702143,0.670415,0.64823
100,0.6581,0.608182,0.744661,0.736705,0.743354,0.73516
150,0.6078,0.552097,0.769731,0.763153,0.755551,0.758535
200,0.5788,0.549172,0.754875,0.775099,0.735672,0.740754
250,0.3557,0.647627,0.743733,0.757886,0.747712,0.727463
300,0.3292,0.536432,0.786134,0.778283,0.787182,0.779697
350,0.324,0.524715,0.792015,0.784324,0.787997,0.785684
400,0.3114,0.548869,0.791396,0.787492,0.791385,0.787071
450,0.1306,0.702756,0.795419,0.786467,0.785825,0.786097
500,0.1177,0.790532,0.774992,0.771973,0.768695,0.764805


asafaya/bert-base-arabic, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8437,0.676102,0.715258,0.713453,0.687712,0.692664
100,0.6649,0.595704,0.747137,0.737016,0.738551,0.737452
150,0.6173,0.565408,0.756732,0.750443,0.751985,0.746089
200,0.5939,0.538958,0.774683,0.766682,0.765438,0.762829
250,0.3203,0.571815,0.770659,0.766534,0.765751,0.763961
300,0.3599,0.556709,0.775611,0.769863,0.75317,0.757697
350,0.3514,0.588603,0.762303,0.773124,0.740574,0.744701
400,0.3465,0.619589,0.776849,0.776453,0.757001,0.762403
450,0.1552,0.68101,0.784587,0.77456,0.774821,0.77316
500,0.1391,0.722336,0.790467,0.780996,0.780192,0.779687


asafaya/bert-base-arabic, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8437,0.676102,0.715258,0.713453,0.687712,0.692664
100,0.6649,0.595704,0.747137,0.737016,0.738551,0.737452
150,0.6173,0.565408,0.756732,0.750443,0.751985,0.746089
200,0.5939,0.538958,0.774683,0.766682,0.765438,0.762829
250,0.3203,0.571815,0.770659,0.766534,0.765751,0.763961
300,0.3599,0.556709,0.775611,0.769863,0.75317,0.757697
350,0.3514,0.588603,0.762303,0.773124,0.740574,0.744701
400,0.3465,0.619589,0.776849,0.776453,0.757001,0.762403
450,0.1552,0.68101,0.784587,0.77456,0.774821,0.77316
500,0.1391,0.722336,0.790467,0.780996,0.780192,0.779687


asafaya/bert-base-arabic, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8437,0.676102,0.715258,0.713453,0.687712,0.692664
100,0.6649,0.595704,0.747137,0.737016,0.738551,0.737452
150,0.6173,0.565408,0.756732,0.750443,0.751985,0.746089
200,0.5939,0.538958,0.774683,0.766682,0.765438,0.762829
250,0.3203,0.571815,0.770659,0.766534,0.765751,0.763961
300,0.3599,0.556709,0.775611,0.769863,0.75317,0.757697
350,0.3514,0.588603,0.762303,0.773124,0.740574,0.744701
400,0.3465,0.619589,0.776849,0.776453,0.757001,0.762403
450,0.1552,0.68101,0.784587,0.77456,0.774821,0.77316
500,0.1391,0.722336,0.790467,0.780996,0.780192,0.779687


asafaya/bert-base-arabic, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8058,0.675244,0.713401,0.699138,0.6985,0.696986
100,0.6842,0.607696,0.741257,0.726547,0.730754,0.726716
150,0.5994,0.570694,0.759208,0.747411,0.747889,0.747625
200,0.5886,0.547253,0.768183,0.756923,0.763569,0.757938
250,0.3598,0.565092,0.77004,0.757603,0.757384,0.75748
300,0.337,0.622966,0.766945,0.782523,0.732719,0.738469
350,0.3473,0.551028,0.787682,0.778074,0.771535,0.773806
400,0.3258,0.528678,0.792015,0.779231,0.783394,0.780933
450,0.1446,0.792773,0.777468,0.773499,0.754982,0.761277
500,0.1442,0.682954,0.78892,0.777968,0.777708,0.777826


asafaya/bert-base-arabic, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8058,0.675244,0.713401,0.699138,0.6985,0.696986
100,0.6842,0.607696,0.741257,0.726547,0.730754,0.726716
150,0.5994,0.570694,0.759208,0.747411,0.747889,0.747625
200,0.5886,0.547253,0.768183,0.756923,0.763569,0.757938
250,0.3598,0.565092,0.77004,0.757603,0.757384,0.75748
300,0.337,0.622966,0.766945,0.782523,0.732719,0.738469
350,0.3473,0.551028,0.787682,0.778074,0.771535,0.773806
400,0.3258,0.528678,0.792015,0.779231,0.783394,0.780933
450,0.1446,0.792773,0.777468,0.773499,0.754982,0.761277
500,0.1442,0.682954,0.78892,0.777968,0.777708,0.777826


asafaya/bert-base-arabic, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at asafaya/bert-base-arabic and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8058,0.675244,0.713401,0.699138,0.6985,0.696986
100,0.6842,0.607696,0.741257,0.726547,0.730754,0.726716
150,0.5994,0.570694,0.759208,0.747411,0.747889,0.747625
200,0.5886,0.547253,0.768183,0.756923,0.763569,0.757938
250,0.3598,0.565092,0.77004,0.757603,0.757384,0.75748
300,0.337,0.622966,0.766945,0.782523,0.732719,0.738469
350,0.3473,0.551028,0.787682,0.778074,0.771535,0.773806
400,0.3258,0.528678,0.792015,0.779231,0.783394,0.780933
450,0.1446,0.792773,0.777468,0.773499,0.754982,0.761277
500,0.1442,0.682954,0.78892,0.777968,0.777708,0.777826


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8252,0.646028,0.724853,0.730746,0.720508,0.706452
100,0.599,0.558247,0.763231,0.757887,0.754253,0.754536
150,0.5716,0.504157,0.784896,0.776444,0.776854,0.776621
200,0.5147,0.492804,0.792634,0.784264,0.786678,0.78379
250,0.2715,0.547942,0.798824,0.793212,0.78883,0.790303
300,0.2379,0.600273,0.805323,0.805643,0.789234,0.793779
350,0.2531,0.574383,0.80099,0.795084,0.792239,0.792422
400,0.2688,0.509185,0.816465,0.808509,0.811244,0.809727
450,0.1008,0.74889,0.805323,0.797382,0.79547,0.796273
500,0.0945,0.754382,0.806252,0.797479,0.800684,0.798002


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8252,0.646028,0.724853,0.730746,0.720508,0.706452
100,0.599,0.558247,0.763231,0.757887,0.754253,0.754536
150,0.5716,0.504157,0.784896,0.776444,0.776854,0.776621
200,0.5147,0.492804,0.792634,0.784264,0.786678,0.78379
250,0.2715,0.547942,0.798824,0.793212,0.78883,0.790303
300,0.2379,0.600273,0.805323,0.805643,0.789234,0.793779
350,0.2531,0.574383,0.80099,0.795084,0.792239,0.792422
400,0.2688,0.509185,0.816465,0.808509,0.811244,0.809727
450,0.1008,0.74889,0.805323,0.797382,0.79547,0.796273
500,0.0945,0.754382,0.806252,0.797479,0.800684,0.798002


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8252,0.646028,0.724853,0.730746,0.720508,0.706452
100,0.599,0.558247,0.763231,0.757887,0.754253,0.754536
150,0.5716,0.504157,0.784896,0.776444,0.776854,0.776621
200,0.5147,0.492804,0.792634,0.784264,0.786678,0.78379
250,0.2715,0.547942,0.798824,0.793212,0.78883,0.790303
300,0.2379,0.600273,0.805323,0.805643,0.789234,0.793779
350,0.2531,0.574383,0.80099,0.795084,0.792239,0.792422
400,0.2688,0.509185,0.816465,0.808509,0.811244,0.809727
450,0.1008,0.74889,0.805323,0.797382,0.79547,0.796273
500,0.0945,0.754382,0.806252,0.797479,0.800684,0.798002


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8282,0.632427,0.728258,0.722938,0.709408,0.713074
100,0.6148,0.561407,0.763541,0.75836,0.747512,0.750409
150,0.5593,0.500467,0.785825,0.77947,0.774528,0.776629
200,0.5007,0.498947,0.793253,0.795723,0.779715,0.782841
250,0.2867,0.676225,0.775302,0.779726,0.781577,0.765518
300,0.2605,0.533548,0.799133,0.796045,0.788246,0.79097
350,0.2531,0.529449,0.8013,0.794862,0.790014,0.792116
400,0.2509,0.551628,0.79511,0.786696,0.789936,0.78808
450,0.0884,0.80568,0.795729,0.786818,0.788641,0.787659
500,0.098,0.713613,0.791086,0.786302,0.774645,0.778681


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8282,0.632427,0.728258,0.722938,0.709408,0.713074
100,0.6148,0.561407,0.763541,0.75836,0.747512,0.750409
150,0.5593,0.500467,0.785825,0.77947,0.774528,0.776629
200,0.5007,0.498947,0.793253,0.795723,0.779715,0.782841
250,0.2867,0.676225,0.775302,0.779726,0.781577,0.765518
300,0.2605,0.533548,0.799133,0.796045,0.788246,0.79097
350,0.2531,0.529449,0.8013,0.794862,0.790014,0.792116
400,0.2509,0.551628,0.79511,0.786696,0.789936,0.78808
450,0.0884,0.80568,0.795729,0.786818,0.788641,0.787659
500,0.098,0.713613,0.791086,0.786302,0.774645,0.778681


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8282,0.632427,0.728258,0.722938,0.709408,0.713074
100,0.6148,0.561407,0.763541,0.75836,0.747512,0.750409
150,0.5593,0.500467,0.785825,0.77947,0.774528,0.776629
200,0.5007,0.498947,0.793253,0.795723,0.779715,0.782841
250,0.2867,0.676225,0.775302,0.779726,0.781577,0.765518
300,0.2605,0.533548,0.799133,0.796045,0.788246,0.79097
350,0.2531,0.529449,0.8013,0.794862,0.790014,0.792116
400,0.2509,0.551628,0.79511,0.786696,0.789936,0.78808
450,0.0884,0.80568,0.795729,0.786818,0.788641,0.787659
500,0.098,0.713613,0.791086,0.786302,0.774645,0.778681


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8274,0.602303,0.746209,0.735011,0.73842,0.736041
100,0.6314,0.553443,0.762922,0.771282,0.737048,0.741366
150,0.5622,0.540049,0.772826,0.770369,0.776602,0.76623
200,0.5198,0.4739,0.797895,0.789364,0.787163,0.787827
250,0.2446,0.633025,0.77623,0.790367,0.764739,0.767322
300,0.2734,0.503033,0.805323,0.795791,0.79909,0.796598
350,0.2517,0.558639,0.796038,0.795942,0.776425,0.782266
400,0.2666,0.539683,0.805323,0.808743,0.787871,0.793099
450,0.1004,0.735791,0.795419,0.795288,0.785652,0.787457
500,0.1035,0.711494,0.805323,0.797382,0.794478,0.795695


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8274,0.602303,0.746209,0.735011,0.73842,0.736041
100,0.6314,0.553443,0.762922,0.771282,0.737048,0.741366
150,0.5622,0.540049,0.772826,0.770369,0.776602,0.76623
200,0.5198,0.4739,0.797895,0.789364,0.787163,0.787827
250,0.2446,0.633025,0.77623,0.790367,0.764739,0.767322
300,0.2734,0.503033,0.805323,0.795791,0.79909,0.796598
350,0.2517,0.558639,0.796038,0.795942,0.776425,0.782266
400,0.2666,0.539683,0.805323,0.808743,0.787871,0.793099
450,0.1004,0.735791,0.795419,0.795288,0.785652,0.787457
500,0.1035,0.711494,0.805323,0.797382,0.794478,0.795695


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8274,0.602303,0.746209,0.735011,0.73842,0.736041
100,0.6314,0.553443,0.762922,0.771282,0.737048,0.741366
150,0.5622,0.540049,0.772826,0.770369,0.776602,0.76623
200,0.5198,0.4739,0.797895,0.789364,0.787163,0.787827
250,0.2446,0.633025,0.77623,0.790367,0.764739,0.767322
300,0.2734,0.503033,0.805323,0.795791,0.79909,0.796598
350,0.2517,0.558639,0.796038,0.795942,0.776425,0.782266
400,0.2666,0.539683,0.805323,0.808743,0.787871,0.793099
450,0.1004,0.735791,0.795419,0.795288,0.785652,0.787457
500,0.1035,0.711494,0.805323,0.797382,0.794478,0.795695


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8777,0.634684,0.727019,0.718916,0.723193,0.718383
100,0.6379,0.551868,0.773135,0.764818,0.765402,0.763871
150,0.5414,0.505552,0.79511,0.786953,0.778776,0.782115
200,0.534,0.482522,0.800681,0.791051,0.792809,0.791474
250,0.2899,0.534947,0.789539,0.778261,0.783473,0.778201
300,0.2503,0.555292,0.804704,0.802481,0.7856,0.791825
350,0.2625,0.498275,0.809966,0.797912,0.801746,0.799108
400,0.2739,0.49531,0.806871,0.796758,0.793815,0.795085
450,0.111,0.782875,0.80749,0.806046,0.784142,0.790641
500,0.1082,0.668188,0.805014,0.793848,0.797617,0.794005


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8777,0.634684,0.727019,0.718916,0.723193,0.718383
100,0.6379,0.551868,0.773135,0.764818,0.765402,0.763871
150,0.5414,0.505552,0.79511,0.786953,0.778776,0.782115
200,0.534,0.482522,0.800681,0.791051,0.792809,0.791474
250,0.2899,0.534947,0.789539,0.778261,0.783473,0.778201
300,0.2503,0.555292,0.804704,0.802481,0.7856,0.791825
350,0.2625,0.498275,0.809966,0.797912,0.801746,0.799108
400,0.2739,0.49531,0.806871,0.796758,0.793815,0.795085
450,0.111,0.782875,0.80749,0.806046,0.784142,0.790641
500,0.1082,0.668188,0.805014,0.793848,0.797617,0.794005


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8777,0.634684,0.727019,0.718916,0.723193,0.718383
100,0.6379,0.551868,0.773135,0.764818,0.765402,0.763871
150,0.5414,0.505552,0.79511,0.786953,0.778776,0.782115
200,0.534,0.482522,0.800681,0.791051,0.792809,0.791474
250,0.2899,0.534947,0.789539,0.778261,0.783473,0.778201
300,0.2503,0.555292,0.804704,0.802481,0.7856,0.791825
350,0.2625,0.498275,0.809966,0.797912,0.801746,0.799108
400,0.2739,0.49531,0.806871,0.796758,0.793815,0.795085
450,0.111,0.782875,0.80749,0.806046,0.784142,0.790641
500,0.1082,0.668188,0.805014,0.793848,0.797617,0.794005


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.6957,0.492971,0.798824,0.795945,0.794952,0.790778
100,0.4711,0.456277,0.810275,0.815889,0.811236,0.807941
150,0.4513,0.404596,0.826989,0.828883,0.81858,0.819564
200,0.4103,0.364048,0.850201,0.843202,0.8516,0.845544
250,0.1825,0.414364,0.855772,0.850954,0.851249,0.851069
300,0.1709,0.481759,0.830393,0.842105,0.819099,0.824378
350,0.1809,0.434458,0.842773,0.845941,0.835415,0.835481
400,0.1674,0.448913,0.842773,0.840297,0.841169,0.836558
450,0.0652,0.695171,0.846797,0.841837,0.847687,0.841143
500,0.0759,0.651748,0.831941,0.848314,0.817511,0.824116


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.6957,0.492971,0.798824,0.795945,0.794952,0.790778
100,0.4711,0.456277,0.810275,0.815889,0.811236,0.807941
150,0.4513,0.404596,0.826989,0.828883,0.81858,0.819564
200,0.4103,0.364048,0.850201,0.843202,0.8516,0.845544
250,0.1825,0.414364,0.855772,0.850954,0.851249,0.851069
300,0.1709,0.481759,0.830393,0.842105,0.819099,0.824378
350,0.1809,0.434458,0.842773,0.845941,0.835415,0.835481
400,0.1674,0.448913,0.842773,0.840297,0.841169,0.836558
450,0.0652,0.695171,0.846797,0.841837,0.847687,0.841143
500,0.0759,0.651748,0.831941,0.848314,0.817511,0.824116


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.6957,0.492971,0.798824,0.795945,0.794952,0.790778
100,0.4711,0.456277,0.810275,0.815889,0.811236,0.807941
150,0.4513,0.404596,0.826989,0.828883,0.81858,0.819564
200,0.4103,0.364048,0.850201,0.843202,0.8516,0.845544
250,0.1825,0.414364,0.855772,0.850954,0.851249,0.851069
300,0.1709,0.481759,0.830393,0.842105,0.819099,0.824378
350,0.1809,0.434458,0.842773,0.845941,0.835415,0.835481
400,0.1674,0.448913,0.842773,0.840297,0.841169,0.836558
450,0.0652,0.695171,0.846797,0.841837,0.847687,0.841143
500,0.0759,0.651748,0.831941,0.848314,0.817511,0.824116


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7192,0.479816,0.803157,0.794425,0.800199,0.796426
100,0.4717,0.420451,0.821727,0.815661,0.815853,0.815621
150,0.4521,0.390355,0.831322,0.824363,0.832874,0.826918
200,0.3913,0.37535,0.843083,0.844127,0.830503,0.835147
250,0.1746,0.479293,0.841226,0.83738,0.841115,0.834341
300,0.1636,0.419841,0.85113,0.849385,0.84042,0.843955
350,0.164,0.412168,0.85113,0.846378,0.846694,0.845936
400,0.1871,0.427645,0.848035,0.841179,0.849803,0.844019
450,0.0604,0.710055,0.837512,0.834495,0.841858,0.834987
500,0.0519,0.65562,0.844321,0.838203,0.841701,0.839219


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7192,0.479816,0.803157,0.794425,0.800199,0.796426
100,0.4717,0.420451,0.821727,0.815661,0.815853,0.815621
150,0.4521,0.390355,0.831322,0.824363,0.832874,0.826918
200,0.3913,0.37535,0.843083,0.844127,0.830503,0.835147
250,0.1746,0.479293,0.841226,0.83738,0.841115,0.834341
300,0.1636,0.419841,0.85113,0.849385,0.84042,0.843955
350,0.164,0.412168,0.85113,0.846378,0.846694,0.845936
400,0.1871,0.427645,0.848035,0.841179,0.849803,0.844019
450,0.0604,0.710055,0.837512,0.834495,0.841858,0.834987
500,0.0519,0.65562,0.844321,0.838203,0.841701,0.839219


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7192,0.479816,0.803157,0.794425,0.800199,0.796426
100,0.4717,0.420451,0.821727,0.815661,0.815853,0.815621
150,0.4521,0.390355,0.831322,0.824363,0.832874,0.826918
200,0.3913,0.37535,0.843083,0.844127,0.830503,0.835147
250,0.1746,0.479293,0.841226,0.83738,0.841115,0.834341
300,0.1636,0.419841,0.85113,0.849385,0.84042,0.843955
350,0.164,0.412168,0.85113,0.846378,0.846694,0.845936
400,0.1871,0.427645,0.848035,0.841179,0.849803,0.844019
450,0.0604,0.710055,0.837512,0.834495,0.841858,0.834987
500,0.0519,0.65562,0.844321,0.838203,0.841701,0.839219


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.6956,0.464569,0.806561,0.800272,0.805059,0.801717
100,0.4812,0.410974,0.829465,0.821699,0.826259,0.823561
150,0.4487,0.4821,0.793253,0.802058,0.799619,0.781261
200,0.4419,0.38292,0.839988,0.844623,0.82395,0.83062
250,0.1917,0.39378,0.864748,0.857842,0.858665,0.858243
300,0.1633,0.401816,0.855153,0.85145,0.847744,0.847803
350,0.1746,0.401435,0.855463,0.849364,0.85087,0.850087
400,0.1693,0.421885,0.856391,0.856094,0.844636,0.848982
450,0.0771,0.535719,0.853296,0.849145,0.849977,0.846672
500,0.0706,0.604634,0.857939,0.855987,0.847086,0.85016


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.6956,0.464569,0.806561,0.800272,0.805059,0.801717
100,0.4812,0.410974,0.829465,0.821699,0.826259,0.823561
150,0.4487,0.4821,0.793253,0.802058,0.799619,0.781261
200,0.4419,0.38292,0.839988,0.844623,0.82395,0.83062
250,0.1917,0.39378,0.864748,0.857842,0.858665,0.858243
300,0.1633,0.401816,0.855153,0.85145,0.847744,0.847803
350,0.1746,0.401435,0.855463,0.849364,0.85087,0.850087
400,0.1693,0.421885,0.856391,0.856094,0.844636,0.848982
450,0.0771,0.535719,0.853296,0.849145,0.849977,0.846672
500,0.0706,0.604634,0.857939,0.855987,0.847086,0.85016


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.6956,0.464569,0.806561,0.800272,0.805059,0.801717
100,0.4812,0.410974,0.829465,0.821699,0.826259,0.823561
150,0.4487,0.4821,0.793253,0.802058,0.799619,0.781261
200,0.4419,0.38292,0.839988,0.844623,0.82395,0.83062
250,0.1917,0.39378,0.864748,0.857842,0.858665,0.858243
300,0.1633,0.401816,0.855153,0.85145,0.847744,0.847803
350,0.1746,0.401435,0.855463,0.849364,0.85087,0.850087
400,0.1693,0.421885,0.856391,0.856094,0.844636,0.848982
450,0.0771,0.535719,0.853296,0.849145,0.849977,0.846672
500,0.0706,0.604634,0.857939,0.855987,0.847086,0.85016


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.739,0.476638,0.81337,0.804634,0.812955,0.806368
100,0.4918,0.408224,0.83875,0.829303,0.833311,0.831043
150,0.4233,0.421716,0.831012,0.829182,0.822505,0.821219
200,0.4174,0.370373,0.84463,0.836264,0.839104,0.837167
250,0.1787,0.435218,0.847416,0.843655,0.836967,0.839801
300,0.179,0.374434,0.862581,0.856774,0.856072,0.856419
350,0.173,0.392583,0.865057,0.859985,0.85718,0.858148
400,0.1829,0.401886,0.85732,0.857545,0.843197,0.848216
450,0.0792,0.635505,0.850201,0.852626,0.838912,0.84305
500,0.0809,0.574266,0.860724,0.862885,0.849979,0.85466


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.739,0.476638,0.81337,0.804634,0.812955,0.806368
100,0.4918,0.408224,0.83875,0.829303,0.833311,0.831043
150,0.4233,0.421716,0.831012,0.829182,0.822505,0.821219
200,0.4174,0.370373,0.84463,0.836264,0.839104,0.837167
250,0.1787,0.435218,0.847416,0.843655,0.836967,0.839801
300,0.179,0.374434,0.862581,0.856774,0.856072,0.856419
350,0.173,0.392583,0.865057,0.859985,0.85718,0.858148
400,0.1829,0.401886,0.85732,0.857545,0.843197,0.848216
450,0.0792,0.635505,0.850201,0.852626,0.838912,0.84305
500,0.0809,0.574266,0.860724,0.862885,0.849979,0.85466


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.739,0.476638,0.81337,0.804634,0.812955,0.806368
100,0.4918,0.408224,0.83875,0.829303,0.833311,0.831043
150,0.4233,0.421716,0.831012,0.829182,0.822505,0.821219
200,0.4174,0.370373,0.84463,0.836264,0.839104,0.837167
250,0.1787,0.435218,0.847416,0.843655,0.836967,0.839801
300,0.179,0.374434,0.862581,0.856774,0.856072,0.856419
350,0.173,0.392583,0.865057,0.859985,0.85718,0.858148
400,0.1829,0.401886,0.85732,0.857545,0.843197,0.848216
450,0.0792,0.635505,0.850201,0.852626,0.838912,0.84305
500,0.0809,0.574266,0.860724,0.862885,0.849979,0.85466


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

UBC-NLP/ARBERTv2, try:0


model.safetensors:   0%|          | 0.00/654M [00:00<?, ?B/s]

Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7956,0.639138,0.729496,0.734463,0.732308,0.727859
100,0.6143,0.564388,0.766636,0.775404,0.750985,0.755677
150,0.5538,0.534783,0.779944,0.781105,0.764185,0.766717
200,0.5555,0.505763,0.781182,0.776596,0.782326,0.777821
250,0.3153,0.558524,0.787682,0.789543,0.783406,0.783462
300,0.3159,0.529598,0.806871,0.799921,0.802414,0.798597
350,0.3028,0.524034,0.797586,0.799788,0.790839,0.786034
400,0.3057,0.493017,0.819561,0.813345,0.813207,0.81324
450,0.1482,0.638628,0.815227,0.810108,0.813401,0.807271
500,0.1429,0.64293,0.799752,0.796977,0.799643,0.790397


UBC-NLP/ARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7956,0.639138,0.729496,0.734463,0.732308,0.727859
100,0.6143,0.564388,0.766636,0.775404,0.750985,0.755677
150,0.5538,0.534783,0.779944,0.781105,0.764185,0.766717
200,0.5555,0.505763,0.781182,0.776596,0.782326,0.777821
250,0.3153,0.558524,0.787682,0.789543,0.783406,0.783462
300,0.3159,0.529598,0.806871,0.799921,0.802414,0.798597
350,0.3028,0.524034,0.797586,0.799788,0.790839,0.786034
400,0.3057,0.493017,0.819561,0.813345,0.813207,0.81324
450,0.1482,0.638628,0.815227,0.810108,0.813401,0.807271
500,0.1429,0.64293,0.799752,0.796977,0.799643,0.790397


UBC-NLP/ARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7956,0.639138,0.729496,0.734463,0.732308,0.727859
100,0.6143,0.564388,0.766636,0.775404,0.750985,0.755677
150,0.5538,0.534783,0.779944,0.781105,0.764185,0.766717
200,0.5555,0.505763,0.781182,0.776596,0.782326,0.777821
250,0.3153,0.558524,0.787682,0.789543,0.783406,0.783462
300,0.3159,0.529598,0.806871,0.799921,0.802414,0.798597
350,0.3028,0.524034,0.797586,0.799788,0.790839,0.786034
400,0.3057,0.493017,0.819561,0.813345,0.813207,0.81324
450,0.1482,0.638628,0.815227,0.810108,0.813401,0.807271
500,0.1429,0.64293,0.799752,0.796977,0.799643,0.790397


UBC-NLP/ARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7993,0.677461,0.733829,0.731059,0.737815,0.724883
100,0.6172,0.580955,0.765088,0.763256,0.761716,0.753455
150,0.5763,0.509519,0.790158,0.796479,0.769398,0.776593
200,0.5371,0.475812,0.80749,0.800167,0.800685,0.800383
250,0.326,0.569434,0.787063,0.785601,0.785031,0.777363
300,0.3155,0.536379,0.794491,0.790528,0.792521,0.784377
350,0.3122,0.463584,0.820799,0.816765,0.811155,0.81297
400,0.3227,0.491483,0.805323,0.799315,0.809688,0.799855
450,0.1554,0.690814,0.802847,0.795217,0.803501,0.796784
500,0.1335,0.652324,0.822346,0.815855,0.816903,0.816358


UBC-NLP/ARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7993,0.677461,0.733829,0.731059,0.737815,0.724883
100,0.6172,0.580955,0.765088,0.763256,0.761716,0.753455
150,0.5763,0.509519,0.790158,0.796479,0.769398,0.776593
200,0.5371,0.475812,0.80749,0.800167,0.800685,0.800383
250,0.326,0.569434,0.787063,0.785601,0.785031,0.777363
300,0.3155,0.536379,0.794491,0.790528,0.792521,0.784377
350,0.3122,0.463584,0.820799,0.816765,0.811155,0.81297
400,0.3227,0.491483,0.805323,0.799315,0.809688,0.799855
450,0.1554,0.690814,0.802847,0.795217,0.803501,0.796784
500,0.1335,0.652324,0.822346,0.815855,0.816903,0.816358


UBC-NLP/ARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7993,0.677461,0.733829,0.731059,0.737815,0.724883
100,0.6172,0.580955,0.765088,0.763256,0.761716,0.753455
150,0.5763,0.509519,0.790158,0.796479,0.769398,0.776593
200,0.5371,0.475812,0.80749,0.800167,0.800685,0.800383
250,0.326,0.569434,0.787063,0.785601,0.785031,0.777363
300,0.3155,0.536379,0.794491,0.790528,0.792521,0.784377
350,0.3122,0.463584,0.820799,0.816765,0.811155,0.81297
400,0.3227,0.491483,0.805323,0.799315,0.809688,0.799855
450,0.1554,0.690814,0.802847,0.795217,0.803501,0.796784
500,0.1335,0.652324,0.822346,0.815855,0.816903,0.816358


UBC-NLP/ARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7925,0.607047,0.738781,0.747111,0.722726,0.724783
100,0.6077,0.597841,0.761684,0.775527,0.733187,0.740476
150,0.5577,0.568586,0.769421,0.782004,0.746384,0.755366
200,0.5491,0.525954,0.789848,0.784584,0.785404,0.78219
250,0.3049,0.548693,0.799133,0.793154,0.802228,0.793955
300,0.3063,0.523359,0.802228,0.801722,0.788145,0.792436
350,0.3259,0.52617,0.8013,0.796346,0.805245,0.797186
400,0.3,0.502792,0.805014,0.802325,0.792681,0.795406
450,0.144,0.640347,0.812751,0.804393,0.808641,0.804714
500,0.1238,0.62224,0.813989,0.809814,0.803118,0.805833


UBC-NLP/ARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7925,0.607047,0.738781,0.747111,0.722726,0.724783
100,0.6077,0.597841,0.761684,0.775527,0.733187,0.740476
150,0.5577,0.568586,0.769421,0.782004,0.746384,0.755366
200,0.5491,0.525954,0.789848,0.784584,0.785404,0.78219
250,0.3049,0.548693,0.799133,0.793154,0.802228,0.793955
300,0.3063,0.523359,0.802228,0.801722,0.788145,0.792436
350,0.3259,0.52617,0.8013,0.796346,0.805245,0.797186
400,0.3,0.502792,0.805014,0.802325,0.792681,0.795406
450,0.144,0.640347,0.812751,0.804393,0.808641,0.804714
500,0.1238,0.62224,0.813989,0.809814,0.803118,0.805833


UBC-NLP/ARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7925,0.607047,0.738781,0.747111,0.722726,0.724783
100,0.6077,0.597841,0.761684,0.775527,0.733187,0.740476
150,0.5577,0.568586,0.769421,0.782004,0.746384,0.755366
200,0.5491,0.525954,0.789848,0.784584,0.785404,0.78219
250,0.3049,0.548693,0.799133,0.793154,0.802228,0.793955
300,0.3063,0.523359,0.802228,0.801722,0.788145,0.792436
350,0.3259,0.52617,0.8013,0.796346,0.805245,0.797186
400,0.3,0.502792,0.805014,0.802325,0.792681,0.795406
450,0.144,0.640347,0.812751,0.804393,0.808641,0.804714
500,0.1238,0.62224,0.813989,0.809814,0.803118,0.805833


UBC-NLP/ARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7946,0.571685,0.773135,0.763713,0.770304,0.766208
100,0.6117,0.51228,0.786444,0.785236,0.765573,0.77207
150,0.5526,0.519523,0.798205,0.792541,0.794044,0.790552
200,0.5606,0.500995,0.790777,0.782726,0.787706,0.778614
250,0.3128,0.532607,0.798205,0.787182,0.79584,0.790178
300,0.315,0.460332,0.820489,0.811445,0.812519,0.81166
350,0.3141,0.47576,0.811823,0.807693,0.799748,0.79928
400,0.3302,0.470724,0.814918,0.808422,0.806698,0.806225
450,0.1491,0.627224,0.809656,0.802627,0.806458,0.8028
500,0.1343,0.651367,0.814299,0.804483,0.810841,0.807105


UBC-NLP/ARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7946,0.571685,0.773135,0.763713,0.770304,0.766208
100,0.6117,0.51228,0.786444,0.785236,0.765573,0.77207
150,0.5526,0.519523,0.798205,0.792541,0.794044,0.790552
200,0.5606,0.500995,0.790777,0.782726,0.787706,0.778614
250,0.3128,0.532607,0.798205,0.787182,0.79584,0.790178
300,0.315,0.460332,0.820489,0.811445,0.812519,0.81166
350,0.3141,0.47576,0.811823,0.807693,0.799748,0.79928
400,0.3302,0.470724,0.814918,0.808422,0.806698,0.806225
450,0.1491,0.627224,0.809656,0.802627,0.806458,0.8028
500,0.1343,0.651367,0.814299,0.804483,0.810841,0.807105


UBC-NLP/ARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/ARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7946,0.571685,0.773135,0.763713,0.770304,0.766208
100,0.6117,0.51228,0.786444,0.785236,0.765573,0.77207
150,0.5526,0.519523,0.798205,0.792541,0.794044,0.790552
200,0.5606,0.500995,0.790777,0.782726,0.787706,0.778614
250,0.3128,0.532607,0.798205,0.787182,0.79584,0.790178
300,0.315,0.460332,0.820489,0.811445,0.812519,0.81166
350,0.3141,0.47576,0.811823,0.807693,0.799748,0.79928
400,0.3302,0.470724,0.814918,0.808422,0.806698,0.806225
450,0.1491,0.627224,0.809656,0.802627,0.806458,0.8028
500,0.1343,0.651367,0.814299,0.804483,0.810841,0.807105


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.73,0.476784,0.815537,0.811144,0.807597,0.808989
100,0.4816,0.420951,0.829465,0.823627,0.832702,0.826164
150,0.4452,0.398809,0.839059,0.834772,0.8397,0.832986
200,0.4014,0.357333,0.858558,0.85174,0.858566,0.853935
250,0.2215,0.373734,0.8632,0.860858,0.858238,0.858855
300,0.1866,0.398186,0.853606,0.85759,0.841256,0.847124
350,0.1932,0.379335,0.85732,0.854544,0.849761,0.851445
400,0.1874,0.385491,0.858248,0.858076,0.848806,0.852475
450,0.075,0.601517,0.862272,0.856444,0.860072,0.857705
500,0.0874,0.503136,0.867843,0.861441,0.866776,0.863212


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.73,0.476784,0.815537,0.811144,0.807597,0.808989
100,0.4816,0.420951,0.829465,0.823627,0.832702,0.826164
150,0.4452,0.398809,0.839059,0.834772,0.8397,0.832986
200,0.4014,0.357333,0.858558,0.85174,0.858566,0.853935
250,0.2215,0.373734,0.8632,0.860858,0.858238,0.858855
300,0.1866,0.398186,0.853606,0.85759,0.841256,0.847124
350,0.1932,0.379335,0.85732,0.854544,0.849761,0.851445
400,0.1874,0.385491,0.858248,0.858076,0.848806,0.852475
450,0.075,0.601517,0.862272,0.856444,0.860072,0.857705
500,0.0874,0.503136,0.867843,0.861441,0.866776,0.863212


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.73,0.476784,0.815537,0.811144,0.807597,0.808989
100,0.4816,0.420951,0.829465,0.823627,0.832702,0.826164
150,0.4452,0.398809,0.839059,0.834772,0.8397,0.832986
200,0.4014,0.357333,0.858558,0.85174,0.858566,0.853935
250,0.2215,0.373734,0.8632,0.860858,0.858238,0.858855
300,0.1866,0.398186,0.853606,0.85759,0.841256,0.847124
350,0.1932,0.379335,0.85732,0.854544,0.849761,0.851445
400,0.1874,0.385491,0.858248,0.858076,0.848806,0.852475
450,0.075,0.601517,0.862272,0.856444,0.860072,0.857705
500,0.0874,0.503136,0.867843,0.861441,0.866776,0.863212


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7441,0.509871,0.793562,0.788428,0.779738,0.782901
100,0.4871,0.478337,0.816775,0.820126,0.810225,0.807108
150,0.4302,0.381279,0.84463,0.838764,0.845635,0.840694
200,0.3867,0.35284,0.8632,0.857671,0.860464,0.858969
250,0.2207,0.451225,0.834107,0.840213,0.837349,0.825564
300,0.1805,0.412228,0.861962,0.866425,0.852119,0.856683
350,0.1847,0.509801,0.842154,0.846039,0.849443,0.834128
400,0.1789,0.366317,0.868771,0.864092,0.863081,0.863536
450,0.0725,0.532389,0.862272,0.857391,0.862113,0.858829
500,0.0676,0.596737,0.859486,0.856131,0.864515,0.853935


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7441,0.509871,0.793562,0.788428,0.779738,0.782901
100,0.4871,0.478337,0.816775,0.820126,0.810225,0.807108
150,0.4302,0.381279,0.84463,0.838764,0.845635,0.840694
200,0.3867,0.35284,0.8632,0.857671,0.860464,0.858969
250,0.2207,0.451225,0.834107,0.840213,0.837349,0.825564
300,0.1805,0.412228,0.861962,0.866425,0.852119,0.856683
350,0.1847,0.509801,0.842154,0.846039,0.849443,0.834128
400,0.1789,0.366317,0.868771,0.864092,0.863081,0.863536
450,0.0725,0.532389,0.862272,0.857391,0.862113,0.858829
500,0.0676,0.596737,0.859486,0.856131,0.864515,0.853935


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7441,0.509871,0.793562,0.788428,0.779738,0.782901
100,0.4871,0.478337,0.816775,0.820126,0.810225,0.807108
150,0.4302,0.381279,0.84463,0.838764,0.845635,0.840694
200,0.3867,0.35284,0.8632,0.857671,0.860464,0.858969
250,0.2207,0.451225,0.834107,0.840213,0.837349,0.825564
300,0.1805,0.412228,0.861962,0.866425,0.852119,0.856683
350,0.1847,0.509801,0.842154,0.846039,0.849443,0.834128
400,0.1789,0.366317,0.868771,0.864092,0.863081,0.863536
450,0.0725,0.532389,0.862272,0.857391,0.862113,0.858829
500,0.0676,0.596737,0.859486,0.856131,0.864515,0.853935


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7496,0.496445,0.799133,0.800713,0.787245,0.790886
100,0.4703,0.432759,0.828227,0.828019,0.811255,0.816241
150,0.4256,0.391149,0.844321,0.838232,0.843618,0.840467
200,0.3948,0.371068,0.847725,0.848423,0.836427,0.840712
250,0.1995,0.431169,0.848035,0.849268,0.838833,0.84187
300,0.1923,0.392504,0.861034,0.856481,0.858023,0.856831
350,0.1781,0.400798,0.862272,0.858547,0.854885,0.856557
400,0.1917,0.449192,0.855772,0.85408,0.846654,0.849127
450,0.0899,0.500365,0.859177,0.852006,0.858578,0.854088
500,0.0607,0.543747,0.865057,0.859793,0.860888,0.85922


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7496,0.496445,0.799133,0.800713,0.787245,0.790886
100,0.4703,0.432759,0.828227,0.828019,0.811255,0.816241
150,0.4256,0.391149,0.844321,0.838232,0.843618,0.840467
200,0.3948,0.371068,0.847725,0.848423,0.836427,0.840712
250,0.1995,0.431169,0.848035,0.849268,0.838833,0.84187
300,0.1923,0.392504,0.861034,0.856481,0.858023,0.856831
350,0.1781,0.400798,0.862272,0.858547,0.854885,0.856557
400,0.1917,0.449192,0.855772,0.85408,0.846654,0.849127
450,0.0899,0.500365,0.859177,0.852006,0.858578,0.854088
500,0.0607,0.543747,0.865057,0.859793,0.860888,0.85922


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7496,0.496445,0.799133,0.800713,0.787245,0.790886
100,0.4703,0.432759,0.828227,0.828019,0.811255,0.816241
150,0.4256,0.391149,0.844321,0.838232,0.843618,0.840467
200,0.3948,0.371068,0.847725,0.848423,0.836427,0.840712
250,0.1995,0.431169,0.848035,0.849268,0.838833,0.84187
300,0.1923,0.392504,0.861034,0.856481,0.858023,0.856831
350,0.1781,0.400798,0.862272,0.858547,0.854885,0.856557
400,0.1917,0.449192,0.855772,0.85408,0.846654,0.849127
450,0.0899,0.500365,0.859177,0.852006,0.858578,0.854088
500,0.0607,0.543747,0.865057,0.859793,0.860888,0.85922


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7666,0.494628,0.806561,0.798889,0.804106,0.800515
100,0.4798,0.406984,0.840297,0.830822,0.837047,0.833376
150,0.4396,0.36491,0.852987,0.845513,0.846056,0.845753
200,0.3993,0.380691,0.840607,0.840048,0.844353,0.838962
250,0.2109,0.387472,0.861653,0.852408,0.860179,0.855485
300,0.207,0.412849,0.852368,0.857061,0.834328,0.842616
350,0.1983,0.396091,0.871247,0.870263,0.860269,0.864486
400,0.1915,0.388837,0.865986,0.867681,0.851501,0.857947
450,0.0933,0.431356,0.864438,0.866281,0.850823,0.856555
500,0.0849,0.489483,0.874961,0.870543,0.867857,0.869121


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7666,0.494628,0.806561,0.798889,0.804106,0.800515
100,0.4798,0.406984,0.840297,0.830822,0.837047,0.833376
150,0.4396,0.36491,0.852987,0.845513,0.846056,0.845753
200,0.3993,0.380691,0.840607,0.840048,0.844353,0.838962
250,0.2109,0.387472,0.861653,0.852408,0.860179,0.855485
300,0.207,0.412849,0.852368,0.857061,0.834328,0.842616
350,0.1983,0.396091,0.871247,0.870263,0.860269,0.864486
400,0.1915,0.388837,0.865986,0.867681,0.851501,0.857947
450,0.0933,0.431356,0.864438,0.866281,0.850823,0.856555
500,0.0849,0.489483,0.874961,0.870543,0.867857,0.869121


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7666,0.494628,0.806561,0.798889,0.804106,0.800515
100,0.4798,0.406984,0.840297,0.830822,0.837047,0.833376
150,0.4396,0.36491,0.852987,0.845513,0.846056,0.845753
200,0.3993,0.380691,0.840607,0.840048,0.844353,0.838962
250,0.2109,0.387472,0.861653,0.852408,0.860179,0.855485
300,0.207,0.412849,0.852368,0.857061,0.834328,0.842616
350,0.1983,0.396091,0.871247,0.870263,0.860269,0.864486
400,0.1915,0.388837,0.865986,0.867681,0.851501,0.857947
450,0.0933,0.431356,0.864438,0.866281,0.850823,0.856555
500,0.0849,0.489483,0.874961,0.870543,0.867857,0.869121


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 12921
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 3231
    })
})

faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5284,0.400084,0.83844,0.84947,0.839307,0.829704
100,0.3359,0.300837,0.871866,0.879323,0.872123,0.871473
150,0.2749,0.220935,0.911792,0.909432,0.908863,0.909021
200,0.2652,0.209582,0.91953,0.918454,0.914176,0.916051
250,0.1136,0.222935,0.921077,0.920465,0.917384,0.918683
300,0.0978,0.232663,0.917982,0.920551,0.90935,0.913698
350,0.1026,0.23338,0.914578,0.915621,0.906847,0.910427
400,0.1065,0.258526,0.909626,0.90691,0.912376,0.904684
450,0.053,0.32388,0.912102,0.911035,0.9115,0.90857
500,0.0565,0.260433,0.922625,0.920193,0.918771,0.919405


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5284,0.400084,0.83844,0.84947,0.839307,0.829704
100,0.3359,0.300837,0.871866,0.879323,0.872123,0.871473
150,0.2749,0.220935,0.911792,0.909432,0.908863,0.909021
200,0.2652,0.209582,0.91953,0.918454,0.914176,0.916051
250,0.1136,0.222935,0.921077,0.920465,0.917384,0.918683
300,0.0978,0.232663,0.917982,0.920551,0.90935,0.913698
350,0.1026,0.23338,0.914578,0.915621,0.906847,0.910427
400,0.1065,0.258526,0.909626,0.90691,0.912376,0.904684
450,0.053,0.32388,0.912102,0.911035,0.9115,0.90857
500,0.0565,0.260433,0.922625,0.920193,0.918771,0.919405


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5284,0.400084,0.83844,0.84947,0.839307,0.829704
100,0.3359,0.300837,0.871866,0.879323,0.872123,0.871473
150,0.2749,0.220935,0.911792,0.909432,0.908863,0.909021
200,0.2652,0.209582,0.91953,0.918454,0.914176,0.916051
250,0.1136,0.222935,0.921077,0.920465,0.917384,0.918683
300,0.0978,0.232663,0.917982,0.920551,0.90935,0.913698
350,0.1026,0.23338,0.914578,0.915621,0.906847,0.910427
400,0.1065,0.258526,0.909626,0.90691,0.912376,0.904684
450,0.053,0.32388,0.912102,0.911035,0.9115,0.90857
500,0.0565,0.260433,0.922625,0.920193,0.918771,0.919405


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5536,0.408775,0.838131,0.845699,0.839266,0.829496
100,0.3126,0.353432,0.8697,0.875913,0.864052,0.865558
150,0.289,0.239166,0.902816,0.898139,0.906919,0.900682
200,0.2446,0.229698,0.911483,0.91257,0.91087,0.910355
250,0.1168,0.246733,0.909935,0.904442,0.911145,0.906303
300,0.1106,0.227497,0.917673,0.913718,0.917407,0.915388
350,0.1076,0.254448,0.91334,0.909325,0.914726,0.911263
400,0.0985,0.259897,0.914887,0.908646,0.91749,0.911563
450,0.044,0.36934,0.90034,0.903735,0.893639,0.897475
500,0.0666,0.350587,0.902816,0.896548,0.907206,0.899475


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5536,0.408775,0.838131,0.845699,0.839266,0.829496
100,0.3126,0.353432,0.8697,0.875913,0.864052,0.865558
150,0.289,0.239166,0.902816,0.898139,0.906919,0.900682
200,0.2446,0.229698,0.911483,0.91257,0.91087,0.910355
250,0.1168,0.246733,0.909935,0.904442,0.911145,0.906303
300,0.1106,0.227497,0.917673,0.913718,0.917407,0.915388
350,0.1076,0.254448,0.91334,0.909325,0.914726,0.911263
400,0.0985,0.259897,0.914887,0.908646,0.91749,0.911563
450,0.044,0.36934,0.90034,0.903735,0.893639,0.897475
500,0.0666,0.350587,0.902816,0.896548,0.907206,0.899475


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5536,0.408775,0.838131,0.845699,0.839266,0.829496
100,0.3126,0.353432,0.8697,0.875913,0.864052,0.865558
150,0.289,0.239166,0.902816,0.898139,0.906919,0.900682
200,0.2446,0.229698,0.911483,0.91257,0.91087,0.910355
250,0.1168,0.246733,0.909935,0.904442,0.911145,0.906303
300,0.1106,0.227497,0.917673,0.913718,0.917407,0.915388
350,0.1076,0.254448,0.91334,0.909325,0.914726,0.911263
400,0.0985,0.259897,0.914887,0.908646,0.91749,0.911563
450,0.044,0.36934,0.90034,0.903735,0.893639,0.897475
500,0.0666,0.350587,0.902816,0.896548,0.907206,0.899475


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5843,0.355677,0.857939,0.854456,0.859403,0.854548
100,0.3281,0.249404,0.897555,0.897559,0.893945,0.894416
150,0.2984,0.267171,0.896626,0.896157,0.896198,0.891269
200,0.2564,0.234778,0.910864,0.909346,0.909123,0.906426
250,0.1072,0.232545,0.918601,0.914023,0.916806,0.91532
300,0.0946,0.244835,0.915816,0.913088,0.912639,0.912187
350,0.0937,0.245143,0.910245,0.911818,0.907852,0.907915
400,0.0879,0.233831,0.918292,0.917258,0.914844,0.91598
450,0.0508,0.302013,0.915197,0.914249,0.909384,0.911615
500,0.0617,0.288511,0.91953,0.916637,0.916952,0.916709


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5843,0.355677,0.857939,0.854456,0.859403,0.854548
100,0.3281,0.249404,0.897555,0.897559,0.893945,0.894416
150,0.2984,0.267171,0.896626,0.896157,0.896198,0.891269
200,0.2564,0.234778,0.910864,0.909346,0.909123,0.906426
250,0.1072,0.232545,0.918601,0.914023,0.916806,0.91532
300,0.0946,0.244835,0.915816,0.913088,0.912639,0.912187
350,0.0937,0.245143,0.910245,0.911818,0.907852,0.907915
400,0.0879,0.233831,0.918292,0.917258,0.914844,0.91598
450,0.0508,0.302013,0.915197,0.914249,0.909384,0.911615
500,0.0617,0.288511,0.91953,0.916637,0.916952,0.916709


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5843,0.355677,0.857939,0.854456,0.859403,0.854548
100,0.3281,0.249404,0.897555,0.897559,0.893945,0.894416
150,0.2984,0.267171,0.896626,0.896157,0.896198,0.891269
200,0.2564,0.234778,0.910864,0.909346,0.909123,0.906426
250,0.1072,0.232545,0.918601,0.914023,0.916806,0.91532
300,0.0946,0.244835,0.915816,0.913088,0.912639,0.912187
350,0.0937,0.245143,0.910245,0.911818,0.907852,0.907915
400,0.0879,0.233831,0.918292,0.917258,0.914844,0.91598
450,0.0508,0.302013,0.915197,0.914249,0.909384,0.911615
500,0.0617,0.288511,0.91953,0.916637,0.916952,0.916709


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5301,0.314365,0.8697,0.860837,0.871255,0.864643
100,0.3293,0.275205,0.886722,0.890797,0.879795,0.88133
150,0.2711,0.223442,0.909006,0.907274,0.901471,0.904148
200,0.2513,0.215061,0.916125,0.908409,0.918039,0.911272
250,0.1098,0.271255,0.909935,0.912896,0.899009,0.904714
300,0.1076,0.24912,0.915506,0.914811,0.90826,0.910975
350,0.105,0.211077,0.921077,0.922745,0.912978,0.916706
400,0.1111,0.208813,0.915506,0.91317,0.912327,0.911795
450,0.0431,0.337737,0.90684,0.912449,0.89195,0.899293
500,0.0581,0.406554,0.895388,0.892301,0.894694,0.888127


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5301,0.314365,0.8697,0.860837,0.871255,0.864643
100,0.3293,0.275205,0.886722,0.890797,0.879795,0.88133
150,0.2711,0.223442,0.909006,0.907274,0.901471,0.904148
200,0.2513,0.215061,0.916125,0.908409,0.918039,0.911272
250,0.1098,0.271255,0.909935,0.912896,0.899009,0.904714
300,0.1076,0.24912,0.915506,0.914811,0.90826,0.910975
350,0.105,0.211077,0.921077,0.922745,0.912978,0.916706
400,0.1111,0.208813,0.915506,0.91317,0.912327,0.911795
450,0.0431,0.337737,0.90684,0.912449,0.89195,0.899293
500,0.0581,0.406554,0.895388,0.892301,0.894694,0.888127


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/12921 [00:00<?, ? examples/s]

Map:   0%|          | 0/3231 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.5301,0.314365,0.8697,0.860837,0.871255,0.864643
100,0.3293,0.275205,0.886722,0.890797,0.879795,0.88133
150,0.2711,0.223442,0.909006,0.907274,0.901471,0.904148
200,0.2513,0.215061,0.916125,0.908409,0.918039,0.911272
250,0.1098,0.271255,0.909935,0.912896,0.899009,0.904714
300,0.1076,0.24912,0.915506,0.914811,0.90826,0.910975
350,0.105,0.211077,0.921077,0.922745,0.912978,0.916706
400,0.1111,0.208813,0.915506,0.91317,0.912327,0.911795
450,0.0431,0.337737,0.90684,0.912449,0.89195,0.899293
500,0.0581,0.406554,0.895388,0.892301,0.894694,0.888127


Unnamed: 0,Model,Accuracy,Precision,Recall,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.822037,0.8122,0.813821,0.812903
3,UBC-NLP/ARBERTv2,0.835655,0.828308,0.827383,0.827834
6,UBC-NLP/MARBERTv2,0.877128,0.872997,0.872043,0.872505
9,asafaya/bert-base-arabic,0.805633,0.796996,0.801571,0.798801
12,aubmindlab/bert-base-arabertv02,0.854225,0.846953,0.851188,0.848533
13,faisalq/SaudiBERT,0.933767,0.931596,0.930681,0.931105
16,qarib/bert-base-qarib,0.870319,0.863613,0.864173,0.863866
