In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'Elec_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/ElecMorocco2016.csv', encoding='utf-8', engine='python', sep='\t') #, quotechar="'"  , quoting=3


      
display(df.columns)
display(len(df))
display(df[:4])



classes = set(df['sentiment'].values)
display(classes)

c = df['sentiment'].value_counts()
display(c)

df['sentiment'] = df['sentiment'].astype('category')
df['label'] = df['sentiment'].cat.codes

df = df[['comment_message', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


# ds = Dataset.from_pandas(df)
# ds = ds.train_test_split(test_size=0.2)

# display(ds)

max_sequence_length = 128


models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]


seeds = [0, 1, 42]



for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['comment_message'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True) # , batched=True
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)  # , batched=True
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 15
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 60, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 60
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-17 08:39:20.189277: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-17 08:39:20.214738: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['index', 'comment_message', 'sentiment', 'comment_published'], dtype='object')

10254

Unnamed: 0,index,comment_message,sentiment,comment_published
0,1,البكاء ليس سمت الرجال ..البكاء سلطة الضعفاء لكسب التعاطف ..انا لست ضد بنكيران وانما الرجل الصالح هو الذي يفعل ما يقول ولا يبكي الا عند النصر,N,2016-10-01 00:07:44
1,2,كلنا بنكيران\nولاية ثانية ان شاء الله\nموتوا بحقدكم,P,2016-10-01 00:47:37
2,3,الشركات في الدول المتقدمة تساهم في بناء أوطانها بدفع الضرائب وفي بلدنا العزيز الشركات تطلب من الدولة أن تخدم عليها؟,N,2016-10-01 00:48:02
3,4,من ينتقد بن كران هم خصوم معارضة لى خاصها هي سلطة لا تهتم لوضعية مواطن,N,2016-10-01 00:49:10


{'N', 'P'}

sentiment
N    6581
P    3673
Name: count, dtype: int64

2

10254

DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4043,0.33008,0.864944,0.851458
120,0.339,0.305941,0.879571,0.86052
180,0.2329,0.36311,0.862506,0.849591
240,0.2022,0.327394,0.878596,0.86259
300,0.1446,0.423781,0.863481,0.849108
360,0.1056,0.45163,0.863481,0.85009
420,0.0712,0.570395,0.877133,0.858573
480,0.0597,0.560492,0.864456,0.852273
540,0.0472,0.66674,0.881521,0.863345
600,0.0231,0.718843,0.879083,0.864879


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.3997,0.321217,0.87177,0.858317
120,0.3432,0.295981,0.879083,0.861155
180,0.231,0.362314,0.861043,0.848874
240,0.2131,0.33829,0.876158,0.863301
300,0.1539,0.402766,0.87372,0.859524
360,0.1114,0.419334,0.868357,0.855628
420,0.0648,0.539528,0.872745,0.852118
480,0.0589,0.497561,0.865431,0.851946
540,0.0476,0.610917,0.877621,0.863001
600,0.0267,0.715392,0.867869,0.854007


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.3997,0.321217,0.87177,0.858317
120,0.3432,0.295981,0.879083,0.861155
180,0.231,0.362314,0.861043,0.848874
240,0.2131,0.33829,0.876158,0.863301
300,0.1539,0.402766,0.87372,0.859524
360,0.1114,0.419334,0.868357,0.855628
420,0.0648,0.539528,0.872745,0.852118
480,0.0589,0.497561,0.865431,0.851946
540,0.0476,0.610917,0.877621,0.863001
600,0.0267,0.715392,0.867869,0.854007


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4074,0.324277,0.870307,0.851078
120,0.3388,0.304631,0.878596,0.863102
180,0.2287,0.326905,0.877621,0.864781
240,0.2143,0.304786,0.881521,0.869004
300,0.1416,0.397921,0.882496,0.868831
360,0.0956,0.508689,0.879083,0.860014
420,0.074,0.572629,0.873233,0.861922
480,0.0545,0.600868,0.856168,0.84776
540,0.0469,0.619131,0.869332,0.85605
600,0.0193,0.773811,0.876158,0.861609


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4074,0.324277,0.870307,0.851078
120,0.3388,0.304631,0.878596,0.863102
180,0.2287,0.326905,0.877621,0.864781
240,0.2143,0.304786,0.881521,0.869004
300,0.1416,0.397921,0.882496,0.868831
360,0.0956,0.508689,0.879083,0.860014
420,0.074,0.572629,0.873233,0.861922
480,0.0545,0.600868,0.856168,0.84776
540,0.0469,0.619131,0.869332,0.85605
600,0.0193,0.773811,0.876158,0.861609


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4074,0.324277,0.870307,0.851078
120,0.3388,0.304631,0.878596,0.863102
180,0.2287,0.326905,0.877621,0.864781
240,0.2143,0.304786,0.881521,0.869004
300,0.1416,0.397921,0.882496,0.868831
360,0.0956,0.508689,0.879083,0.860014
420,0.074,0.572629,0.873233,0.861922
480,0.0545,0.600868,0.856168,0.84776
540,0.0469,0.619131,0.869332,0.85605
600,0.0193,0.773811,0.876158,0.861609


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4011,0.303289,0.877621,0.86358
120,0.3419,0.3255,0.865919,0.846224
180,0.2414,0.317465,0.879571,0.864501
240,0.2159,0.329173,0.87372,0.861641
300,0.1508,0.426129,0.855193,0.843796
360,0.1132,0.40694,0.870795,0.857334
420,0.069,0.623057,0.862019,0.850903
480,0.0508,0.557539,0.860068,0.849311
540,0.0354,0.685896,0.876646,0.862203
600,0.037,0.664728,0.867382,0.855015


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4011,0.303289,0.877621,0.86358
120,0.3419,0.3255,0.865919,0.846224
180,0.2414,0.317465,0.879571,0.864501
240,0.2159,0.329173,0.87372,0.861641
300,0.1508,0.426129,0.855193,0.843796
360,0.1132,0.40694,0.870795,0.857334
420,0.069,0.623057,0.862019,0.850903
480,0.0508,0.557539,0.860068,0.849311
540,0.0354,0.685896,0.876646,0.862203
600,0.037,0.664728,0.867382,0.855015


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4011,0.303289,0.877621,0.86358
120,0.3419,0.3255,0.865919,0.846224
180,0.2414,0.317465,0.879571,0.864501
240,0.2159,0.329173,0.87372,0.861641
300,0.1508,0.426129,0.855193,0.843796
360,0.1132,0.40694,0.870795,0.857334
420,0.069,0.623057,0.862019,0.850903
480,0.0508,0.557539,0.860068,0.849311
540,0.0354,0.685896,0.876646,0.862203
600,0.037,0.664728,0.867382,0.855015


DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4646,0.385631,0.836177,0.818074
120,0.3899,0.399089,0.83374,0.794091
180,0.2848,0.416925,0.842028,0.824451
240,0.2412,0.424569,0.846416,0.827574
300,0.1624,0.616489,0.829352,0.808485
360,0.1128,0.46766,0.842028,0.820313
420,0.0758,1.00777,0.831302,0.809842
480,0.0673,0.744465,0.805461,0.792639
540,0.0503,0.83338,0.83959,0.820555
600,0.0321,0.800456,0.840078,0.817813


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4646,0.385631,0.836177,0.818074
120,0.3899,0.399089,0.83374,0.794091
180,0.2848,0.416925,0.842028,0.824451
240,0.2412,0.424569,0.846416,0.827574
300,0.1624,0.616489,0.829352,0.808485
360,0.1128,0.46766,0.842028,0.820313
420,0.0758,1.00777,0.831302,0.809842
480,0.0673,0.744465,0.805461,0.792639
540,0.0503,0.83338,0.83959,0.820555
600,0.0321,0.800456,0.840078,0.817813


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4646,0.385631,0.836177,0.818074
120,0.3899,0.399089,0.83374,0.794091
180,0.2848,0.416925,0.842028,0.824451
240,0.2412,0.424569,0.846416,0.827574
300,0.1624,0.616489,0.829352,0.808485
360,0.1128,0.46766,0.842028,0.820313
420,0.0758,1.00777,0.831302,0.809842
480,0.0673,0.744465,0.805461,0.792639
540,0.0503,0.83338,0.83959,0.820555
600,0.0321,0.800456,0.840078,0.817813


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4719,0.360987,0.845929,0.822655
120,0.3985,0.360768,0.852755,0.836816
180,0.2573,0.447539,0.839103,0.82517
240,0.2502,0.367273,0.847392,0.827141
300,0.1424,0.750729,0.82155,0.810981
360,0.0906,0.663673,0.83569,0.820312
420,0.0833,0.900671,0.814725,0.803167
480,0.0559,0.762259,0.838615,0.822153
540,0.0463,0.840308,0.822038,0.812263
600,0.0281,0.996831,0.841053,0.822129


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4719,0.360987,0.845929,0.822655
120,0.3985,0.360768,0.852755,0.836816
180,0.2573,0.447539,0.839103,0.82517
240,0.2502,0.367273,0.847392,0.827141
300,0.1424,0.750729,0.82155,0.810981
360,0.0906,0.663673,0.83569,0.820312
420,0.0833,0.900671,0.814725,0.803167
480,0.0559,0.762259,0.838615,0.822153
540,0.0463,0.840308,0.822038,0.812263
600,0.0281,0.996831,0.841053,0.822129


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4719,0.360987,0.845929,0.822655
120,0.3985,0.360768,0.852755,0.836816
180,0.2573,0.447539,0.839103,0.82517
240,0.2502,0.367273,0.847392,0.827141
300,0.1424,0.750729,0.82155,0.810981
360,0.0906,0.663673,0.83569,0.820312
420,0.0833,0.900671,0.814725,0.803167
480,0.0559,0.762259,0.838615,0.822153
540,0.0463,0.840308,0.822038,0.812263
600,0.0281,0.996831,0.841053,0.822129


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4764,0.390344,0.838128,0.820847
120,0.3953,0.387269,0.831789,0.798081
180,0.2711,0.39037,0.847392,0.833005
240,0.249,0.374397,0.843491,0.82649
300,0.1537,0.554246,0.835202,0.821773
360,0.1152,0.469462,0.832765,0.815946
420,0.0728,0.938566,0.823988,0.812095
480,0.0429,0.706461,0.83374,0.81874
540,0.052,0.83095,0.842028,0.825857
600,0.0311,0.767818,0.840566,0.824983


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4764,0.390344,0.838128,0.820847
120,0.3953,0.387269,0.831789,0.798081
180,0.2711,0.39037,0.847392,0.833005
240,0.249,0.374397,0.843491,0.82649
300,0.1537,0.554246,0.835202,0.821773
360,0.1152,0.469462,0.832765,0.815946
420,0.0728,0.938566,0.823988,0.812095
480,0.0429,0.706461,0.83374,0.81874
540,0.052,0.83095,0.842028,0.825857
600,0.0311,0.767818,0.840566,0.824983


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4764,0.390344,0.838128,0.820847
120,0.3953,0.387269,0.831789,0.798081
180,0.2711,0.39037,0.847392,0.833005
240,0.249,0.374397,0.843491,0.82649
300,0.1537,0.554246,0.835202,0.821773
360,0.1152,0.469462,0.832765,0.815946
420,0.0728,0.938566,0.823988,0.812095
480,0.0429,0.706461,0.83374,0.81874
540,0.052,0.83095,0.842028,0.825857
600,0.0311,0.767818,0.840566,0.824983


DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4234,0.341839,0.854217,0.83199
120,0.3524,0.331895,0.861043,0.834143
180,0.2298,0.397474,0.847879,0.834407
240,0.1822,0.3802,0.852267,0.83279
300,0.1268,0.538624,0.863969,0.846834
360,0.0807,0.502307,0.856655,0.842494
420,0.0523,0.855404,0.826426,0.816589
480,0.0457,0.614232,0.853242,0.836744
540,0.0287,0.855127,0.863481,0.845772
600,0.0215,0.918424,0.85178,0.826492


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4234,0.341839,0.854217,0.83199
120,0.3524,0.331895,0.861043,0.834143
180,0.2298,0.397474,0.847879,0.834407
240,0.1822,0.3802,0.852267,0.83279
300,0.1268,0.538624,0.863969,0.846834
360,0.0807,0.502307,0.856655,0.842494
420,0.0523,0.855404,0.826426,0.816589
480,0.0457,0.614232,0.853242,0.836744
540,0.0287,0.855127,0.863481,0.845772
600,0.0215,0.918424,0.85178,0.826492


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4234,0.341839,0.854217,0.83199
120,0.3524,0.331895,0.861043,0.834143
180,0.2298,0.397474,0.847879,0.834407
240,0.1822,0.3802,0.852267,0.83279
300,0.1268,0.538624,0.863969,0.846834
360,0.0807,0.502307,0.856655,0.842494
420,0.0523,0.855404,0.826426,0.816589
480,0.0457,0.614232,0.853242,0.836744
540,0.0287,0.855127,0.863481,0.845772
600,0.0215,0.918424,0.85178,0.826492


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4239,0.338529,0.859093,0.838653
120,0.3655,0.311994,0.87372,0.858022
180,0.2222,0.331113,0.87177,0.858597
240,0.1978,0.337073,0.867869,0.855231
300,0.1022,0.562437,0.865431,0.851753
360,0.0769,0.544589,0.863969,0.852409
420,0.0545,0.759677,0.872257,0.855361
480,0.0565,0.677569,0.865431,0.849302
540,0.0298,0.801343,0.85763,0.844739
600,0.0167,0.877615,0.857143,0.84328


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4239,0.338529,0.859093,0.838653
120,0.3655,0.311994,0.87372,0.858022
180,0.2222,0.331113,0.87177,0.858597
240,0.1978,0.337073,0.867869,0.855231
300,0.1022,0.562437,0.865431,0.851753
360,0.0769,0.544589,0.863969,0.852409
420,0.0545,0.759677,0.872257,0.855361
480,0.0565,0.677569,0.865431,0.849302
540,0.0298,0.801343,0.85763,0.844739
600,0.0167,0.877615,0.857143,0.84328


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4239,0.338529,0.859093,0.838653
120,0.3655,0.311994,0.87372,0.858022
180,0.2222,0.331113,0.87177,0.858597
240,0.1978,0.337073,0.867869,0.855231
300,0.1022,0.562437,0.865431,0.851753
360,0.0769,0.544589,0.863969,0.852409
420,0.0545,0.759677,0.872257,0.855361
480,0.0565,0.677569,0.865431,0.849302
540,0.0298,0.801343,0.85763,0.844739
600,0.0167,0.877615,0.857143,0.84328


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4166,0.337961,0.857143,0.839617
120,0.3565,0.356134,0.85178,0.822501
180,0.2301,0.384618,0.860556,0.844064
240,0.1769,0.400948,0.853242,0.8401
300,0.118,0.60301,0.860556,0.841387
360,0.0699,0.540754,0.844466,0.831937
420,0.0633,0.751275,0.858118,0.842918
480,0.0466,0.774821,0.85763,0.840106
540,0.0322,0.862724,0.85373,0.840968
600,0.0234,0.905148,0.858606,0.841883


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4166,0.337961,0.857143,0.839617
120,0.3565,0.356134,0.85178,0.822501
180,0.2301,0.384618,0.860556,0.844064
240,0.1769,0.400948,0.853242,0.8401
300,0.118,0.60301,0.860556,0.841387
360,0.0699,0.540754,0.844466,0.831937
420,0.0633,0.751275,0.858118,0.842918
480,0.0466,0.774821,0.85763,0.840106
540,0.0322,0.862724,0.85373,0.840968
600,0.0234,0.905148,0.858606,0.841883


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4166,0.337961,0.857143,0.839617
120,0.3565,0.356134,0.85178,0.822501
180,0.2301,0.384618,0.860556,0.844064
240,0.1769,0.400948,0.853242,0.8401
300,0.118,0.60301,0.860556,0.841387
360,0.0699,0.540754,0.844466,0.831937
420,0.0633,0.751275,0.858118,0.842918
480,0.0466,0.774821,0.85763,0.840106
540,0.0322,0.862724,0.85373,0.840968
600,0.0234,0.905148,0.858606,0.841883


DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4285,0.338697,0.864456,0.846988
120,0.3634,0.335557,0.863481,0.840467
180,0.2379,0.441742,0.856655,0.835534
240,0.1914,0.36675,0.861531,0.843685
300,0.1394,0.508007,0.83959,0.826062
360,0.0989,0.525899,0.845929,0.829595
420,0.0738,0.748289,0.854705,0.83343
480,0.0627,0.639085,0.847879,0.829767
540,0.0462,1.169614,0.823501,0.810091
600,0.0314,1.019813,0.824476,0.811763


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4285,0.338697,0.864456,0.846988
120,0.3634,0.335557,0.863481,0.840467
180,0.2379,0.441742,0.856655,0.835534
240,0.1914,0.36675,0.861531,0.843685
300,0.1394,0.508007,0.83959,0.826062
360,0.0989,0.525899,0.845929,0.829595
420,0.0738,0.748289,0.854705,0.83343
480,0.0627,0.639085,0.847879,0.829767
540,0.0462,1.169614,0.823501,0.810091
600,0.0314,1.019813,0.824476,0.811763


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4285,0.338697,0.864456,0.846988
120,0.3634,0.335557,0.863481,0.840467
180,0.2379,0.441742,0.856655,0.835534
240,0.1914,0.36675,0.861531,0.843685
300,0.1394,0.508007,0.83959,0.826062
360,0.0989,0.525899,0.845929,0.829595
420,0.0738,0.748289,0.854705,0.83343
480,0.0627,0.639085,0.847879,0.829767
540,0.0462,1.169614,0.823501,0.810091
600,0.0314,1.019813,0.824476,0.811763


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4546,0.361048,0.851292,0.824608
120,0.3763,0.312754,0.874695,0.858599
180,0.2434,0.328313,0.868844,0.855654
240,0.2316,0.314172,0.86982,0.852545
300,0.1413,0.428602,0.867869,0.853117
360,0.0986,0.527584,0.866407,0.851337
420,0.0806,0.698084,0.849829,0.836923
480,0.0684,0.835363,0.835202,0.825184
540,0.0466,0.815834,0.848854,0.836537
600,0.043,0.870873,0.864456,0.845101


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4546,0.361048,0.851292,0.824608
120,0.3763,0.312754,0.874695,0.858599
180,0.2434,0.328313,0.868844,0.855654
240,0.2316,0.314172,0.86982,0.852545
300,0.1413,0.428602,0.867869,0.853117
360,0.0986,0.527584,0.866407,0.851337
420,0.0806,0.698084,0.849829,0.836923
480,0.0684,0.835363,0.835202,0.825184
540,0.0466,0.815834,0.848854,0.836537
600,0.043,0.870873,0.864456,0.845101


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4546,0.361048,0.851292,0.824608
120,0.3763,0.312754,0.874695,0.858599
180,0.2434,0.328313,0.868844,0.855654
240,0.2316,0.314172,0.86982,0.852545
300,0.1413,0.428602,0.867869,0.853117
360,0.0986,0.527584,0.866407,0.851337
420,0.0806,0.698084,0.849829,0.836923
480,0.0684,0.835363,0.835202,0.825184
540,0.0466,0.815834,0.848854,0.836537
600,0.043,0.870873,0.864456,0.845101


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4567,0.372381,0.856168,0.84221
120,0.3672,0.380743,0.840566,0.808433
180,0.2534,0.413368,0.859093,0.847566
240,0.2188,0.356931,0.865431,0.850148
300,0.131,0.552411,0.850317,0.833027
360,0.0975,0.472748,0.857143,0.843479
420,0.0607,0.7843,0.859093,0.843468
480,0.038,0.917362,0.85373,0.836777
540,0.0452,0.99452,0.847392,0.833213
600,0.0315,1.023019,0.844466,0.827572


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4567,0.372381,0.856168,0.84221
120,0.3672,0.380743,0.840566,0.808433
180,0.2534,0.413368,0.859093,0.847566
240,0.2188,0.356931,0.865431,0.850148
300,0.131,0.552411,0.850317,0.833027
360,0.0975,0.472748,0.857143,0.843479
420,0.0607,0.7843,0.859093,0.843468
480,0.038,0.917362,0.85373,0.836777
540,0.0452,0.99452,0.847392,0.833213
600,0.0315,1.023019,0.844466,0.827572


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4567,0.372381,0.856168,0.84221
120,0.3672,0.380743,0.840566,0.808433
180,0.2534,0.413368,0.859093,0.847566
240,0.2188,0.356931,0.865431,0.850148
300,0.131,0.552411,0.850317,0.833027
360,0.0975,0.472748,0.857143,0.843479
420,0.0607,0.7843,0.859093,0.843468
480,0.038,0.917362,0.85373,0.836777
540,0.0452,0.99452,0.847392,0.833213
600,0.0315,1.023019,0.844466,0.827572


DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4351,0.328148,0.865431,0.84523
120,0.3449,0.321765,0.87177,0.849696
180,0.2365,0.330817,0.861043,0.84626
240,0.1998,0.376475,0.865919,0.84535
300,0.1392,0.495495,0.857143,0.840191
360,0.0992,0.451566,0.862994,0.848009
420,0.0659,0.654003,0.862506,0.847828
480,0.0601,0.707979,0.855193,0.839463
540,0.0701,0.753655,0.844466,0.833427
600,0.0519,0.627995,0.873233,0.854202


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4351,0.328148,0.865431,0.84523
120,0.3449,0.321765,0.87177,0.849696
180,0.2365,0.330817,0.861043,0.84626
240,0.1998,0.376475,0.865919,0.84535
300,0.1392,0.495495,0.857143,0.840191
360,0.0992,0.451566,0.862994,0.848009
420,0.0659,0.654003,0.862506,0.847828
480,0.0601,0.707979,0.855193,0.839463
540,0.0701,0.753655,0.844466,0.833427
600,0.0519,0.627995,0.873233,0.854202


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4351,0.328148,0.865431,0.84523
120,0.3449,0.321765,0.87177,0.849696
180,0.2365,0.330817,0.861043,0.84626
240,0.1998,0.376475,0.865919,0.84535
300,0.1392,0.495495,0.857143,0.840191
360,0.0992,0.451566,0.862994,0.848009
420,0.0659,0.654003,0.862506,0.847828
480,0.0601,0.707979,0.855193,0.839463
540,0.0701,0.753655,0.844466,0.833427
600,0.0519,0.627995,0.873233,0.854202


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4484,0.368968,0.859093,0.833055
120,0.3519,0.299389,0.884447,0.871189
180,0.2388,0.31974,0.874695,0.863223
240,0.2268,0.322319,0.880059,0.866713
300,0.1427,0.405654,0.874695,0.862093
360,0.0966,0.499166,0.86982,0.856912
420,0.091,0.655361,0.864456,0.854953
480,0.0608,0.591277,0.859093,0.848847
540,0.0529,0.609896,0.871282,0.860631
600,0.0323,0.652717,0.876646,0.8623


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4484,0.368968,0.859093,0.833055
120,0.3519,0.299389,0.884447,0.871189
180,0.2388,0.31974,0.874695,0.863223
240,0.2268,0.322319,0.880059,0.866713
300,0.1427,0.405654,0.874695,0.862093
360,0.0966,0.499166,0.86982,0.856912
420,0.091,0.655361,0.864456,0.854953
480,0.0608,0.591277,0.859093,0.848847
540,0.0529,0.609896,0.871282,0.860631
600,0.0323,0.652717,0.876646,0.8623


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4484,0.368968,0.859093,0.833055
120,0.3519,0.299389,0.884447,0.871189
180,0.2388,0.31974,0.874695,0.863223
240,0.2268,0.322319,0.880059,0.866713
300,0.1427,0.405654,0.874695,0.862093
360,0.0966,0.499166,0.86982,0.856912
420,0.091,0.655361,0.864456,0.854953
480,0.0608,0.591277,0.859093,0.848847
540,0.0529,0.609896,0.871282,0.860631
600,0.0323,0.652717,0.876646,0.8623


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4428,0.355264,0.862506,0.842499
120,0.3509,0.360789,0.854705,0.826982
180,0.2457,0.323717,0.876646,0.862684
240,0.2082,0.34686,0.872257,0.862007
300,0.1553,0.482392,0.859093,0.849413
360,0.1104,0.473103,0.850317,0.841796
420,0.0845,0.703531,0.865919,0.848807
480,0.0515,0.652947,0.873233,0.861498
540,0.0603,0.598395,0.87372,0.860003
600,0.0555,0.570377,0.861043,0.848321


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4428,0.355264,0.862506,0.842499
120,0.3509,0.360789,0.854705,0.826982
180,0.2457,0.323717,0.876646,0.862684
240,0.2082,0.34686,0.872257,0.862007
300,0.1553,0.482392,0.859093,0.849413
360,0.1104,0.473103,0.850317,0.841796
420,0.0845,0.703531,0.865919,0.848807
480,0.0515,0.652947,0.873233,0.861498
540,0.0603,0.598395,0.87372,0.860003
600,0.0555,0.570377,0.861043,0.848321


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4428,0.355264,0.862506,0.842499
120,0.3509,0.360789,0.854705,0.826982
180,0.2457,0.323717,0.876646,0.862684
240,0.2082,0.34686,0.872257,0.862007
300,0.1553,0.482392,0.859093,0.849413
360,0.1104,0.473103,0.850317,0.841796
420,0.0845,0.703531,0.865919,0.848807
480,0.0515,0.652947,0.873233,0.861498
540,0.0603,0.598395,0.87372,0.860003
600,0.0555,0.570377,0.861043,0.848321


DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5124,0.501269,0.758654,0.750716
120,0.4389,0.369967,0.844954,0.81705
180,0.3805,0.347401,0.858606,0.836578
240,0.3299,0.348951,0.85568,0.836714
300,0.2575,0.449928,0.847392,0.832368
360,0.196,0.383032,0.860556,0.837049
420,0.1411,0.489436,0.847392,0.833522
480,0.092,0.512435,0.854705,0.83343
540,0.0983,0.658702,0.860556,0.841752
600,0.041,0.674409,0.864456,0.844733


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5124,0.501269,0.758654,0.750716
120,0.4389,0.369967,0.844954,0.81705
180,0.3805,0.347401,0.858606,0.836578
240,0.3299,0.348951,0.85568,0.836714
300,0.2575,0.449928,0.847392,0.832368
360,0.196,0.383032,0.860556,0.837049
420,0.1411,0.489436,0.847392,0.833522
480,0.092,0.512435,0.854705,0.83343
540,0.0983,0.658702,0.860556,0.841752
600,0.041,0.674409,0.864456,0.844733


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5124,0.501269,0.758654,0.750716
120,0.4389,0.369967,0.844954,0.81705
180,0.3805,0.347401,0.858606,0.836578
240,0.3299,0.348951,0.85568,0.836714
300,0.2575,0.449928,0.847392,0.832368
360,0.196,0.383032,0.860556,0.837049
420,0.1411,0.489436,0.847392,0.833522
480,0.092,0.512435,0.854705,0.83343
540,0.0983,0.658702,0.860556,0.841752
600,0.041,0.674409,0.864456,0.844733


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.545,0.375861,0.841541,0.81841
120,0.3976,0.351011,0.861531,0.845698
180,0.3205,0.342189,0.861043,0.846054
240,0.3256,0.33823,0.859093,0.845713
300,0.2157,0.423984,0.847879,0.835483
360,0.1551,0.435624,0.848854,0.835369
420,0.1179,0.642573,0.852755,0.836258
480,0.0782,0.607093,0.861531,0.844487
540,0.0615,0.755177,0.850804,0.833395
600,0.0418,0.730729,0.85178,0.835956


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.545,0.375861,0.841541,0.81841
120,0.3976,0.351011,0.861531,0.845698
180,0.3205,0.342189,0.861043,0.846054
240,0.3256,0.33823,0.859093,0.845713
300,0.2157,0.423984,0.847879,0.835483
360,0.1551,0.435624,0.848854,0.835369
420,0.1179,0.642573,0.852755,0.836258
480,0.0782,0.607093,0.861531,0.844487
540,0.0615,0.755177,0.850804,0.833395
600,0.0418,0.730729,0.85178,0.835956


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.545,0.375861,0.841541,0.81841
120,0.3976,0.351011,0.861531,0.845698
180,0.3205,0.342189,0.861043,0.846054
240,0.3256,0.33823,0.859093,0.845713
300,0.2157,0.423984,0.847879,0.835483
360,0.1551,0.435624,0.848854,0.835369
420,0.1179,0.642573,0.852755,0.836258
480,0.0782,0.607093,0.861531,0.844487
540,0.0615,0.755177,0.850804,0.833395
600,0.0418,0.730729,0.85178,0.835956


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4703,0.378496,0.830327,0.810661
120,0.405,0.3757,0.843491,0.816226
180,0.3149,0.39028,0.834715,0.822108
240,0.2985,0.352109,0.849342,0.826371
300,0.224,0.430093,0.850317,0.835687
360,0.1775,0.39093,0.845929,0.826458
420,0.1271,0.639537,0.843979,0.83087
480,0.1033,0.553771,0.849829,0.827285
540,0.0758,0.693306,0.858118,0.843747
600,0.0649,0.724817,0.847392,0.833005


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4703,0.378496,0.830327,0.810661
120,0.405,0.3757,0.843491,0.816226
180,0.3149,0.39028,0.834715,0.822108
240,0.2985,0.352109,0.849342,0.826371
300,0.224,0.430093,0.850317,0.835687
360,0.1775,0.39093,0.845929,0.826458
420,0.1271,0.639537,0.843979,0.83087
480,0.1033,0.553771,0.849829,0.827285
540,0.0758,0.693306,0.858118,0.843747
600,0.0649,0.724817,0.847392,0.833005


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4703,0.378496,0.830327,0.810661
120,0.405,0.3757,0.843491,0.816226
180,0.3149,0.39028,0.834715,0.822108
240,0.2985,0.352109,0.849342,0.826371
300,0.224,0.430093,0.850317,0.835687
360,0.1775,0.39093,0.845929,0.826458
420,0.1271,0.639537,0.843979,0.83087
480,0.1033,0.553771,0.849829,0.827285
540,0.0758,0.693306,0.858118,0.843747
600,0.0649,0.724817,0.847392,0.833005


DatasetDict({
    train: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 8203
    })
    test: Dataset({
        features: ['comment_message', 'label'],
        num_rows: 2051
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4989,0.467862,0.793272,0.777689
120,0.435,0.462001,0.80156,0.73935
180,0.3479,0.415867,0.818625,0.792233
240,0.3062,0.416615,0.831789,0.806301
300,0.2262,0.48179,0.828376,0.803403
360,0.1778,0.4881,0.832765,0.807892
420,0.1401,0.804721,0.798147,0.784338
480,0.099,0.788331,0.793272,0.779245
540,0.0816,0.685482,0.830814,0.802208
600,0.0406,0.912527,0.823501,0.805813


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4989,0.467862,0.793272,0.777689
120,0.435,0.462001,0.80156,0.73935
180,0.3479,0.415867,0.818625,0.792233
240,0.3062,0.416615,0.831789,0.806301
300,0.2262,0.48179,0.828376,0.803403
360,0.1778,0.4881,0.832765,0.807892
420,0.1401,0.804721,0.798147,0.784338
480,0.099,0.788331,0.793272,0.779245
540,0.0816,0.685482,0.830814,0.802208
600,0.0406,0.912527,0.823501,0.805813


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.4989,0.467862,0.793272,0.777689
120,0.435,0.462001,0.80156,0.73935
180,0.3479,0.415867,0.818625,0.792233
240,0.3062,0.416615,0.831789,0.806301
300,0.2262,0.48179,0.828376,0.803403
360,0.1778,0.4881,0.832765,0.807892
420,0.1401,0.804721,0.798147,0.784338
480,0.099,0.788331,0.793272,0.779245
540,0.0816,0.685482,0.830814,0.802208
600,0.0406,0.912527,0.823501,0.805813


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5086,0.400263,0.823988,0.794049
120,0.4375,0.377068,0.838615,0.813704
180,0.3435,0.409003,0.836177,0.817824
240,0.3109,0.400466,0.83569,0.819515
300,0.2195,0.536499,0.828864,0.811035
360,0.1697,0.482029,0.827889,0.808142
420,0.1261,0.699511,0.807899,0.792484
480,0.0952,0.682021,0.809849,0.796077
540,0.0785,0.826258,0.834715,0.809514
600,0.0356,0.955492,0.829839,0.811228


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5086,0.400263,0.823988,0.794049
120,0.4375,0.377068,0.838615,0.813704
180,0.3435,0.409003,0.836177,0.817824
240,0.3109,0.400466,0.83569,0.819515
300,0.2195,0.536499,0.828864,0.811035
360,0.1697,0.482029,0.827889,0.808142
420,0.1261,0.699511,0.807899,0.792484
480,0.0952,0.682021,0.809849,0.796077
540,0.0785,0.826258,0.834715,0.809514
600,0.0356,0.955492,0.829839,0.811228


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5086,0.400263,0.823988,0.794049
120,0.4375,0.377068,0.838615,0.813704
180,0.3435,0.409003,0.836177,0.817824
240,0.3109,0.400466,0.83569,0.819515
300,0.2195,0.536499,0.828864,0.811035
360,0.1697,0.482029,0.827889,0.808142
420,0.1261,0.699511,0.807899,0.792484
480,0.0952,0.682021,0.809849,0.796077
540,0.0785,0.826258,0.834715,0.809514
600,0.0356,0.955492,0.829839,0.811228


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5051,0.445808,0.798635,0.780468
120,0.452,0.439255,0.810336,0.768018
180,0.3334,0.450055,0.818137,0.786077
240,0.3232,0.446,0.810824,0.792268
300,0.2339,0.499006,0.824963,0.795896
360,0.1813,0.543101,0.807899,0.789723
420,0.1226,1.119851,0.759629,0.75127
480,0.0928,0.806001,0.800585,0.788092
540,0.0728,0.962623,0.809361,0.792163
600,0.0488,1.095183,0.784495,0.773849


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5051,0.445808,0.798635,0.780468
120,0.452,0.439255,0.810336,0.768018
180,0.3334,0.450055,0.818137,0.786077
240,0.3232,0.446,0.810824,0.792268
300,0.2339,0.499006,0.824963,0.795896
360,0.1813,0.543101,0.807899,0.789723
420,0.1226,1.119851,0.759629,0.75127
480,0.0928,0.806001,0.800585,0.788092
540,0.0728,0.962623,0.809361,0.792163
600,0.0488,1.095183,0.784495,0.773849


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/8203 [00:00<?, ? examples/s]

Map:   0%|          | 0/2051 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
60,0.5051,0.445808,0.798635,0.780468
120,0.452,0.439255,0.810336,0.768018
180,0.3334,0.450055,0.818137,0.786077
240,0.3232,0.446,0.810824,0.792268
300,0.2339,0.499006,0.824963,0.795896
360,0.1813,0.543101,0.807899,0.789723
420,0.1226,1.119851,0.759629,0.75127
480,0.0928,0.806001,0.800585,0.788092
540,0.0728,0.962623,0.809361,0.792163
600,0.0488,1.095183,0.784495,0.773849


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.852755,0.836816
3,SI2M-Lab/DarijaBERT-arabizi,0.83569,0.819515
6,SI2M-Lab/DarijaBERT-mix,0.861043,0.846054
9,UBC-NLP/MARBERT,0.874695,0.858599
12,UBC-NLP/MARBERTv2,0.884447,0.871189
15,aubmindlab/bert-base-arabertv02-twitter,0.883471,0.870011
18,qarib/bert-base-qarib,0.87177,0.858597
