In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'OpenTC_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df1 = pd.read_csv('datasets/OpenAccessArDialect/Topic.csv', encoding='utf-8', engine='python', sep='\t') #, quotechar="'"  , quoting=3
df2 = pd.read_csv('datasets/OpenAccessArDialect/dialect.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3

df2 = df2[df2['dialect'] == 'Morocco']
      
display(df1.columns)
display(df1[:4])

display(df2.columns)
display(df2[:4])
display(len(df2))




df = df1[df1['Text'].isin(df2['Twits'])]

display(df[:5])
display(len(df))

c = df['Tag'].value_counts()
display(c)

classes = set(df['Tag'].values)
display(classes)

df['Tag'] = df['Tag'].astype('category')
df['label'] = df['Tag'].cat.codes

df = df[['Text', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))



max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]


seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['Text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 15
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 50, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 50
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-18 15:02:23.870580: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-18 15:02:23.893528: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['Text', 'Tag'], dtype='object')

Unnamed: 0,Text,Tag
0,: حالة الطوارئ الصحية: وثيقة التنقل لن تسلم للقاصرين، عند وجود حالة ضرورية لتنقل القاصرين لا بد ان يكونوا مرفوقين باشخاص ب…,social
1,: السلطات تعمل على الإغلاق الشامل لبويزاكارن البؤرة الجديدة لڤيروس كورونا بالمغرب والأقاليم الجنوبية.,sante
2,"للأسف هادي أنانية ولكن لبعلوك عجبني الرد ديالو ههههه , أميييين شكرا خويا",autre
3,انا لله وانا اليه راجعون. الله يرحمها و يغفر لها,autre


Index(['Twits', 'dialect'], dtype='object')

Unnamed: 0,Twits,dialect
13393,slawiya msikina tb9a f darha 😐😕😕,Morocco
13394,ناس د الرباط أش واقع عندكم تما ... ياكما شي شبه عائلية 😐,Morocco
13395,لي دوا مشاا 😂😂,Morocco
13396,: وزراء تقلقوا,Morocco


9965

Unnamed: 0,Text,Tag
0,: حالة الطوارئ الصحية: وثيقة التنقل لن تسلم للقاصرين، عند وجود حالة ضرورية لتنقل القاصرين لا بد ان يكونوا مرفوقين باشخاص ب…,social
1,: السلطات تعمل على الإغلاق الشامل لبويزاكارن البؤرة الجديدة لڤيروس كورونا بالمغرب والأقاليم الجنوبية.,sante
2,"للأسف هادي أنانية ولكن لبعلوك عجبني الرد ديالو ههههه , أميييين شكرا خويا",autre
3,انا لله وانا اليه راجعون. الله يرحمها و يغفر لها,autre
4,مالنا,autre


6091

Tag
autre         5411
social         346
sante          217
politique       93
sport           12
économique      12
Name: count, dtype: int64

{'autre', 'politique', 'sante', 'social', 'sport', 'économique'}

6

6091

DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3719,0.214103,0.924528,0.415141
100,0.2231,0.203357,0.932732,0.460995
150,0.1982,0.222039,0.92863,0.397309
200,0.1239,0.262024,0.913864,0.394064
250,0.0899,0.307031,0.913043,0.417406
300,0.0496,0.374638,0.90402,0.390995
350,0.0261,0.319584,0.92863,0.431467
400,0.015,0.360239,0.922888,0.427331
450,0.0116,0.36964,0.923708,0.435141
500,0.0046,0.379611,0.925349,0.436668


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3547,0.214592,0.926169,0.411447
100,0.2219,0.207123,0.926989,0.450028
150,0.1943,0.231369,0.932732,0.417796
200,0.1089,0.313618,0.912223,0.404532
250,0.0842,0.30942,0.920427,0.4356
300,0.0572,0.302575,0.92945,0.445935
350,0.0284,0.442617,0.90402,0.413087
400,0.0228,0.377503,0.918786,0.408006
450,0.0128,0.384164,0.925349,0.434571
500,0.005,0.38612,0.926169,0.427562


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3547,0.214592,0.926169,0.411447
100,0.2219,0.207123,0.926989,0.450028
150,0.1943,0.231369,0.932732,0.417796
200,0.1089,0.313618,0.912223,0.404532
250,0.0842,0.30942,0.920427,0.4356
300,0.0572,0.302575,0.92945,0.445935
350,0.0284,0.442617,0.90402,0.413087
400,0.0228,0.377503,0.918786,0.408006
450,0.0128,0.384164,0.925349,0.434571
500,0.005,0.38612,0.926169,0.427562


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3452,0.262148,0.910582,0.304831
100,0.2158,0.236936,0.916325,0.402538
150,0.1816,0.241882,0.924528,0.406315
200,0.0915,0.304441,0.913043,0.415212
250,0.0882,0.356963,0.912223,0.423148
300,0.0433,0.394473,0.916325,0.406903
350,0.0179,0.437663,0.908121,0.409196
400,0.0194,0.465046,0.917966,0.399255
450,0.0113,0.469469,0.918786,0.418248
500,0.0063,0.468018,0.913043,0.417035


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3452,0.262148,0.910582,0.304831
100,0.2158,0.236936,0.916325,0.402538
150,0.1816,0.241882,0.924528,0.406315
200,0.0915,0.304441,0.913043,0.415212
250,0.0882,0.356963,0.912223,0.423148
300,0.0433,0.394473,0.916325,0.406903
350,0.0179,0.437663,0.908121,0.409196
400,0.0194,0.465046,0.917966,0.399255
450,0.0113,0.469469,0.918786,0.418248
500,0.0063,0.468018,0.913043,0.417035


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3452,0.262148,0.910582,0.304831
100,0.2158,0.236936,0.916325,0.402538
150,0.1816,0.241882,0.924528,0.406315
200,0.0915,0.304441,0.913043,0.415212
250,0.0882,0.356963,0.912223,0.423148
300,0.0433,0.394473,0.916325,0.406903
350,0.0179,0.437663,0.908121,0.409196
400,0.0194,0.465046,0.917966,0.399255
450,0.0113,0.469469,0.918786,0.418248
500,0.0063,0.468018,0.913043,0.417035


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3281,0.307573,0.903199,0.259396
100,0.244,0.252799,0.918786,0.353654
150,0.1936,0.236136,0.923708,0.381671
200,0.1068,0.291216,0.913864,0.365575
250,0.073,0.3788,0.896637,0.413828
300,0.0391,0.331962,0.910582,0.410226
350,0.0212,0.370332,0.907301,0.393039
400,0.011,0.418137,0.903199,0.400462
450,0.0074,0.446197,0.910582,0.428395
500,0.0033,0.429462,0.908121,0.411574


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3281,0.307573,0.903199,0.259396
100,0.244,0.252799,0.918786,0.353654
150,0.1936,0.236136,0.923708,0.381671
200,0.1068,0.291216,0.913864,0.365575
250,0.073,0.3788,0.896637,0.413828
300,0.0391,0.331962,0.910582,0.410226
350,0.0212,0.370332,0.907301,0.393039
400,0.011,0.418137,0.903199,0.400462
450,0.0074,0.446197,0.910582,0.428395
500,0.0033,0.429462,0.908121,0.411574


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3281,0.307573,0.903199,0.259396
100,0.244,0.252799,0.918786,0.353654
150,0.1936,0.236136,0.923708,0.381671
200,0.1068,0.291216,0.913864,0.365575
250,0.073,0.3788,0.896637,0.413828
300,0.0391,0.331962,0.910582,0.410226
350,0.0212,0.370332,0.907301,0.393039
400,0.011,0.418137,0.903199,0.400462
450,0.0074,0.446197,0.910582,0.428395
500,0.0033,0.429462,0.908121,0.411574


DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4412,0.223968,0.923708,0.402119
100,0.239,0.232815,0.920427,0.456064
150,0.2205,0.209236,0.92863,0.432417
200,0.1318,0.282804,0.926169,0.374775
250,0.1196,0.350901,0.922067,0.351196
300,0.0929,0.281414,0.920427,0.346897
350,0.0545,0.403412,0.90484,0.409007
400,0.0295,0.354905,0.922888,0.409331
450,0.0224,0.391174,0.926989,0.435188
500,0.0103,0.379064,0.934372,0.451359


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4412,0.223968,0.923708,0.402119
100,0.239,0.232815,0.920427,0.456064
150,0.2205,0.209236,0.92863,0.432417
200,0.1318,0.282804,0.926169,0.374775
250,0.1196,0.350901,0.922067,0.351196
300,0.0929,0.281414,0.920427,0.346897
350,0.0545,0.403412,0.90484,0.409007
400,0.0295,0.354905,0.922888,0.409331
450,0.0224,0.391174,0.926989,0.435188
500,0.0103,0.379064,0.934372,0.451359


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4412,0.223968,0.923708,0.402119
100,0.239,0.232815,0.920427,0.456064
150,0.2205,0.209236,0.92863,0.432417
200,0.1318,0.282804,0.926169,0.374775
250,0.1196,0.350901,0.922067,0.351196
300,0.0929,0.281414,0.920427,0.346897
350,0.0545,0.403412,0.90484,0.409007
400,0.0295,0.354905,0.922888,0.409331
450,0.0224,0.391174,0.926989,0.435188
500,0.0103,0.379064,0.934372,0.451359


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4283,0.282339,0.913864,0.330201
100,0.242,0.273967,0.916325,0.370732
150,0.2237,0.323412,0.919606,0.341471
200,0.1372,0.322892,0.914684,0.376038
250,0.1269,0.341503,0.916325,0.398724
300,0.0762,0.421827,0.920427,0.507514
350,0.0535,0.398069,0.90484,0.463315
400,0.0314,0.441587,0.913864,0.49393
450,0.0168,0.489433,0.911403,0.52315
500,0.014,0.505835,0.917966,0.396809


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4283,0.282339,0.913864,0.330201
100,0.242,0.273967,0.916325,0.370732
150,0.2237,0.323412,0.919606,0.341471
200,0.1372,0.322892,0.914684,0.376038
250,0.1269,0.341503,0.916325,0.398724
300,0.0762,0.421827,0.920427,0.507514
350,0.0535,0.398069,0.90484,0.463315
400,0.0314,0.441587,0.913864,0.49393
450,0.0168,0.489433,0.911403,0.52315
500,0.014,0.505835,0.917966,0.396809


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4283,0.282339,0.913864,0.330201
100,0.242,0.273967,0.916325,0.370732
150,0.2237,0.323412,0.919606,0.341471
200,0.1372,0.322892,0.914684,0.376038
250,0.1269,0.341503,0.916325,0.398724
300,0.0762,0.421827,0.920427,0.507514
350,0.0535,0.398069,0.90484,0.463315
400,0.0314,0.441587,0.913864,0.49393
450,0.0168,0.489433,0.911403,0.52315
500,0.014,0.505835,0.917966,0.396809


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4169,0.318362,0.90402,0.270525
100,0.2607,0.274712,0.922067,0.353298
150,0.2234,0.239968,0.921247,0.374382
200,0.143,0.293371,0.923708,0.387224
250,0.1099,0.398067,0.910582,0.395354
300,0.0834,0.376529,0.920427,0.389662
350,0.0403,0.421246,0.914684,0.442327
400,0.0362,0.438543,0.922888,0.510235
450,0.0304,0.46387,0.914684,0.486722
500,0.0173,0.480267,0.920427,0.610428


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4169,0.318362,0.90402,0.270525
100,0.2607,0.274712,0.922067,0.353298
150,0.2234,0.239968,0.921247,0.374382
200,0.143,0.293371,0.923708,0.387224
250,0.1099,0.398067,0.910582,0.395354
300,0.0834,0.376529,0.920427,0.389662
350,0.0403,0.421246,0.914684,0.442327
400,0.0362,0.438543,0.922888,0.510235
450,0.0304,0.46387,0.914684,0.486722
500,0.0173,0.480267,0.920427,0.610428


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4169,0.318362,0.90402,0.270525
100,0.2607,0.274712,0.922067,0.353298
150,0.2234,0.239968,0.921247,0.374382
200,0.143,0.293371,0.923708,0.387224
250,0.1099,0.398067,0.910582,0.395354
300,0.0834,0.376529,0.920427,0.389662
350,0.0403,0.421246,0.914684,0.442327
400,0.0362,0.438543,0.922888,0.510235
450,0.0304,0.46387,0.914684,0.486722
500,0.0173,0.480267,0.920427,0.610428


DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4308,0.229139,0.917966,0.35997
100,0.2344,0.227809,0.92945,0.435622
150,0.2127,0.217902,0.926989,0.423121
200,0.116,0.341201,0.930271,0.454252
250,0.1093,0.307681,0.916325,0.418995
300,0.0698,0.37629,0.926989,0.384313
350,0.0511,0.378267,0.914684,0.40179
400,0.0445,0.372569,0.921247,0.409168
450,0.0269,0.419688,0.922888,0.427942
500,0.0127,0.428745,0.923708,0.435662


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4308,0.229139,0.917966,0.35997
100,0.2344,0.227809,0.92945,0.435622
150,0.2127,0.217902,0.926989,0.423121
200,0.116,0.341201,0.930271,0.454252
250,0.1093,0.307681,0.916325,0.418995
300,0.0698,0.37629,0.926989,0.384313
350,0.0511,0.378267,0.914684,0.40179
400,0.0445,0.372569,0.921247,0.409168
450,0.0269,0.419688,0.922888,0.427942
500,0.0127,0.428745,0.923708,0.435662


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4308,0.229139,0.917966,0.35997
100,0.2344,0.227809,0.92945,0.435622
150,0.2127,0.217902,0.926989,0.423121
200,0.116,0.341201,0.930271,0.454252
250,0.1093,0.307681,0.916325,0.418995
300,0.0698,0.37629,0.926989,0.384313
350,0.0511,0.378267,0.914684,0.40179
400,0.0445,0.372569,0.921247,0.409168
450,0.0269,0.419688,0.922888,0.427942
500,0.0127,0.428745,0.923708,0.435662


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3979,0.279302,0.912223,0.32873
100,0.2223,0.249239,0.920427,0.393223
150,0.1866,0.293893,0.923708,0.378286
200,0.1182,0.325791,0.923708,0.415649
250,0.1043,0.329766,0.912223,0.419733
300,0.0726,0.428861,0.922888,0.406232
350,0.0458,0.398642,0.922888,0.428405
400,0.0433,0.434244,0.915505,0.397889
450,0.0289,0.416533,0.919606,0.424121
500,0.015,0.482695,0.915505,0.4144


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3979,0.279302,0.912223,0.32873
100,0.2223,0.249239,0.920427,0.393223
150,0.1866,0.293893,0.923708,0.378286
200,0.1182,0.325791,0.923708,0.415649
250,0.1043,0.329766,0.912223,0.419733
300,0.0726,0.428861,0.922888,0.406232
350,0.0458,0.398642,0.922888,0.428405
400,0.0433,0.434244,0.915505,0.397889
450,0.0289,0.416533,0.919606,0.424121
500,0.015,0.482695,0.915505,0.4144


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3979,0.279302,0.912223,0.32873
100,0.2223,0.249239,0.920427,0.393223
150,0.1866,0.293893,0.923708,0.378286
200,0.1182,0.325791,0.923708,0.415649
250,0.1043,0.329766,0.912223,0.419733
300,0.0726,0.428861,0.922888,0.406232
350,0.0458,0.398642,0.922888,0.428405
400,0.0433,0.434244,0.915505,0.397889
450,0.0289,0.416533,0.919606,0.424121
500,0.015,0.482695,0.915505,0.4144


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3741,0.289357,0.908942,0.308787
100,0.236,0.357484,0.922067,0.354623
150,0.1906,0.260664,0.915505,0.38236
200,0.109,0.396866,0.918786,0.389936
250,0.0928,0.416626,0.916325,0.39639
300,0.0643,0.368144,0.919606,0.434253
350,0.0515,0.382745,0.918786,0.485328
400,0.0308,0.38719,0.921247,0.412917
450,0.0161,0.420593,0.921247,0.544056
500,0.014,0.425932,0.922067,0.557553


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3741,0.289357,0.908942,0.308787
100,0.236,0.357484,0.922067,0.354623
150,0.1906,0.260664,0.915505,0.38236
200,0.109,0.396866,0.918786,0.389936
250,0.0928,0.416626,0.916325,0.39639
300,0.0643,0.368144,0.919606,0.434253
350,0.0515,0.382745,0.918786,0.485328
400,0.0308,0.38719,0.921247,0.412917
450,0.0161,0.420593,0.921247,0.544056
500,0.014,0.425932,0.922067,0.557553


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3741,0.289357,0.908942,0.308787
100,0.236,0.357484,0.922067,0.354623
150,0.1906,0.260664,0.915505,0.38236
200,0.109,0.396866,0.918786,0.389936
250,0.0928,0.416626,0.916325,0.39639
300,0.0643,0.368144,0.919606,0.434253
350,0.0515,0.382745,0.918786,0.485328
400,0.0308,0.38719,0.921247,0.412917
450,0.0161,0.420593,0.921247,0.544056
500,0.014,0.425932,0.922067,0.557553


DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4519,0.226384,0.916325,0.428692
100,0.2414,0.26438,0.895816,0.423114
150,0.2195,0.253699,0.918786,0.412748
200,0.1248,0.336659,0.925349,0.450788
250,0.1189,0.330284,0.923708,0.425131
300,0.09,0.382674,0.917966,0.420009
350,0.0897,0.391363,0.919606,0.387945
400,0.0556,0.41884,0.922067,0.428482
450,0.0546,0.477984,0.90402,0.403748
500,0.0316,0.462549,0.915505,0.417402


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4519,0.226384,0.916325,0.428692
100,0.2414,0.26438,0.895816,0.423114
150,0.2195,0.253699,0.918786,0.412748
200,0.1248,0.336659,0.925349,0.450788
250,0.1189,0.330284,0.923708,0.425131
300,0.09,0.382674,0.917966,0.420009
350,0.0897,0.391363,0.919606,0.387945
400,0.0556,0.41884,0.922067,0.428482
450,0.0546,0.477984,0.90402,0.403748
500,0.0316,0.462549,0.915505,0.417402


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4519,0.226384,0.916325,0.428692
100,0.2414,0.26438,0.895816,0.423114
150,0.2195,0.253699,0.918786,0.412748
200,0.1248,0.336659,0.925349,0.450788
250,0.1189,0.330284,0.923708,0.425131
300,0.09,0.382674,0.917966,0.420009
350,0.0897,0.391363,0.919606,0.387945
400,0.0556,0.41884,0.922067,0.428482
450,0.0546,0.477984,0.90402,0.403748
500,0.0316,0.462549,0.915505,0.417402


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4325,0.279736,0.90484,0.305137
100,0.2357,0.284612,0.910582,0.388529
150,0.2048,0.315444,0.923708,0.372354
200,0.131,0.355919,0.903199,0.384482
250,0.132,0.514867,0.88105,0.377825
300,0.0968,0.407652,0.907301,0.373618
350,0.0702,0.522535,0.899918,0.411489
400,0.0689,0.523896,0.902379,0.388923
450,0.0521,0.597915,0.900738,0.400815
500,0.0485,0.591441,0.899918,0.405089


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4325,0.279736,0.90484,0.305137
100,0.2357,0.284612,0.910582,0.388529
150,0.2048,0.315444,0.923708,0.372354
200,0.131,0.355919,0.903199,0.384482
250,0.132,0.514867,0.88105,0.377825
300,0.0968,0.407652,0.907301,0.373618
350,0.0702,0.522535,0.899918,0.411489
400,0.0689,0.523896,0.902379,0.388923
450,0.0521,0.597915,0.900738,0.400815
500,0.0485,0.591441,0.899918,0.405089


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4325,0.279736,0.90484,0.305137
100,0.2357,0.284612,0.910582,0.388529
150,0.2048,0.315444,0.923708,0.372354
200,0.131,0.355919,0.903199,0.384482
250,0.132,0.514867,0.88105,0.377825
300,0.0968,0.407652,0.907301,0.373618
350,0.0702,0.522535,0.899918,0.411489
400,0.0689,0.523896,0.902379,0.388923
450,0.0521,0.597915,0.900738,0.400815
500,0.0485,0.591441,0.899918,0.405089


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4036,0.289671,0.909762,0.299394
100,0.2451,0.371411,0.922067,0.356175
150,0.1983,0.288687,0.911403,0.377101
200,0.1261,0.33837,0.917966,0.379582
250,0.1076,0.469938,0.917145,0.342479
300,0.0853,0.42677,0.913864,0.377094
350,0.0576,0.436997,0.913043,0.380627
400,0.0672,0.423678,0.910582,0.386103
450,0.0322,0.44121,0.925349,0.413895
500,0.0223,0.515115,0.918786,0.59828


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4036,0.289671,0.909762,0.299394
100,0.2451,0.371411,0.922067,0.356175
150,0.1983,0.288687,0.911403,0.377101
200,0.1261,0.33837,0.917966,0.379582
250,0.1076,0.469938,0.917145,0.342479
300,0.0853,0.42677,0.913864,0.377094
350,0.0576,0.436997,0.913043,0.380627
400,0.0672,0.423678,0.910582,0.386103
450,0.0322,0.44121,0.925349,0.413895
500,0.0223,0.515115,0.918786,0.59828


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4036,0.289671,0.909762,0.299394
100,0.2451,0.371411,0.922067,0.356175
150,0.1983,0.288687,0.911403,0.377101
200,0.1261,0.33837,0.917966,0.379582
250,0.1076,0.469938,0.917145,0.342479
300,0.0853,0.42677,0.913864,0.377094
350,0.0576,0.436997,0.913043,0.380627
400,0.0672,0.423678,0.910582,0.386103
450,0.0322,0.44121,0.925349,0.413895
500,0.0223,0.515115,0.918786,0.59828


DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5317,0.260418,0.903199,0.247771
100,0.2566,0.22221,0.926989,0.459561
150,0.2268,0.258791,0.930271,0.444444
200,0.1432,0.328992,0.921247,0.425624
250,0.1242,0.380332,0.911403,0.432071
300,0.1075,0.357966,0.922067,0.450414
350,0.0919,0.368317,0.917966,0.366632
400,0.0556,0.437401,0.913043,0.415767
450,0.0649,0.393809,0.917966,0.439818
500,0.0436,0.366408,0.926169,0.442256


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5317,0.260418,0.903199,0.247771
100,0.2566,0.22221,0.926989,0.459561
150,0.2268,0.258791,0.930271,0.444444
200,0.1432,0.328992,0.921247,0.425624
250,0.1242,0.380332,0.911403,0.432071
300,0.1075,0.357966,0.922067,0.450414
350,0.0919,0.368317,0.917966,0.366632
400,0.0556,0.437401,0.913043,0.415767
450,0.0649,0.393809,0.917966,0.439818
500,0.0436,0.366408,0.926169,0.442256


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5317,0.260418,0.903199,0.247771
100,0.2566,0.22221,0.926989,0.459561
150,0.2268,0.258791,0.930271,0.444444
200,0.1432,0.328992,0.921247,0.425624
250,0.1242,0.380332,0.911403,0.432071
300,0.1075,0.357966,0.922067,0.450414
350,0.0919,0.368317,0.917966,0.366632
400,0.0556,0.437401,0.913043,0.415767
450,0.0649,0.393809,0.917966,0.439818
500,0.0436,0.366408,0.926169,0.442256


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5112,0.292025,0.913043,0.310703
100,0.2469,0.265944,0.910582,0.369385
150,0.2112,0.264175,0.926989,0.383144
200,0.1395,0.332265,0.903199,0.381462
250,0.1209,0.343481,0.911403,0.37567
300,0.0824,0.406892,0.911403,0.400947
350,0.0631,0.394246,0.918786,0.427958
400,0.0615,0.410881,0.917966,0.545433
450,0.0447,0.438237,0.919606,0.543782
500,0.0491,0.477984,0.916325,0.523889


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5112,0.292025,0.913043,0.310703
100,0.2469,0.265944,0.910582,0.369385
150,0.2112,0.264175,0.926989,0.383144
200,0.1395,0.332265,0.903199,0.381462
250,0.1209,0.343481,0.911403,0.37567
300,0.0824,0.406892,0.911403,0.400947
350,0.0631,0.394246,0.918786,0.427958
400,0.0615,0.410881,0.917966,0.545433
450,0.0447,0.438237,0.919606,0.543782
500,0.0491,0.477984,0.916325,0.523889


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5112,0.292025,0.913043,0.310703
100,0.2469,0.265944,0.910582,0.369385
150,0.2112,0.264175,0.926989,0.383144
200,0.1395,0.332265,0.903199,0.381462
250,0.1209,0.343481,0.911403,0.37567
300,0.0824,0.406892,0.911403,0.400947
350,0.0631,0.394246,0.918786,0.427958
400,0.0615,0.410881,0.917966,0.545433
450,0.0447,0.438237,0.919606,0.543782
500,0.0491,0.477984,0.916325,0.523889


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5112,0.374366,0.90566,0.277835
100,0.2676,0.324487,0.921247,0.358051
150,0.2217,0.293697,0.899098,0.363884
200,0.1562,0.330374,0.913043,0.366549
250,0.1228,0.374002,0.925349,0.368039
300,0.1144,0.357446,0.916325,0.361732
350,0.0849,0.36119,0.90484,0.370939
400,0.0753,0.568655,0.870386,0.388724
450,0.0496,0.43554,0.90566,0.40346
500,0.0346,0.446307,0.907301,0.586797


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5112,0.374366,0.90566,0.277835
100,0.2676,0.324487,0.921247,0.358051
150,0.2217,0.293697,0.899098,0.363884
200,0.1562,0.330374,0.913043,0.366549
250,0.1228,0.374002,0.925349,0.368039
300,0.1144,0.357446,0.916325,0.361732
350,0.0849,0.36119,0.90484,0.370939
400,0.0753,0.568655,0.870386,0.388724
450,0.0496,0.43554,0.90566,0.40346
500,0.0346,0.446307,0.907301,0.586797


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5112,0.374366,0.90566,0.277835
100,0.2676,0.324487,0.921247,0.358051
150,0.2217,0.293697,0.899098,0.363884
200,0.1562,0.330374,0.913043,0.366549
250,0.1228,0.374002,0.925349,0.368039
300,0.1144,0.357446,0.916325,0.361732
350,0.0849,0.36119,0.90484,0.370939
400,0.0753,0.568655,0.870386,0.388724
450,0.0496,0.43554,0.90566,0.40346
500,0.0346,0.446307,0.907301,0.586797


DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4514,0.270958,0.896637,0.373777
100,0.3086,0.294741,0.897457,0.208913
150,0.2928,0.231566,0.918786,0.379199
200,0.2236,0.245522,0.92945,0.444737
250,0.209,0.264504,0.933552,0.462523
300,0.1416,0.291744,0.913864,0.437475
350,0.1097,0.301764,0.92945,0.516719
400,0.0605,0.36502,0.926989,0.519617
450,0.0478,0.403165,0.916325,0.433822
500,0.0268,0.368834,0.931091,0.440027


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4514,0.270958,0.896637,0.373777
100,0.3086,0.294741,0.897457,0.208913
150,0.2928,0.231566,0.918786,0.379199
200,0.2236,0.245522,0.92945,0.444737
250,0.209,0.264504,0.933552,0.462523
300,0.1416,0.291744,0.913864,0.437475
350,0.1097,0.301764,0.92945,0.516719
400,0.0605,0.36502,0.926989,0.519617
450,0.0478,0.403165,0.916325,0.433822
500,0.0268,0.368834,0.931091,0.440027


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4514,0.270958,0.896637,0.373777
100,0.3086,0.294741,0.897457,0.208913
150,0.2928,0.231566,0.918786,0.379199
200,0.2236,0.245522,0.92945,0.444737
250,0.209,0.264504,0.933552,0.462523
300,0.1416,0.291744,0.913864,0.437475
350,0.1097,0.301764,0.92945,0.516719
400,0.0605,0.36502,0.926989,0.519617
450,0.0478,0.403165,0.916325,0.433822
500,0.0268,0.368834,0.931091,0.440027


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4369,0.305716,0.909762,0.301833
100,0.2561,0.275023,0.907301,0.381371
150,0.2291,0.237312,0.92945,0.403572
200,0.1725,0.27242,0.913043,0.376563
250,0.137,0.373435,0.876948,0.378885
300,0.1028,0.338484,0.918786,0.380064
350,0.0475,0.440508,0.893355,0.398322
400,0.0482,0.43089,0.908942,0.519368
450,0.027,0.457061,0.906481,0.467285
500,0.0164,0.483125,0.911403,0.532997


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4369,0.305716,0.909762,0.301833
100,0.2561,0.275023,0.907301,0.381371
150,0.2291,0.237312,0.92945,0.403572
200,0.1725,0.27242,0.913043,0.376563
250,0.137,0.373435,0.876948,0.378885
300,0.1028,0.338484,0.918786,0.380064
350,0.0475,0.440508,0.893355,0.398322
400,0.0482,0.43089,0.908942,0.519368
450,0.027,0.457061,0.906481,0.467285
500,0.0164,0.483125,0.911403,0.532997


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4369,0.305716,0.909762,0.301833
100,0.2561,0.275023,0.907301,0.381371
150,0.2291,0.237312,0.92945,0.403572
200,0.1725,0.27242,0.913043,0.376563
250,0.137,0.373435,0.876948,0.378885
300,0.1028,0.338484,0.918786,0.380064
350,0.0475,0.440508,0.893355,0.398322
400,0.0482,0.43089,0.908942,0.519368
450,0.027,0.457061,0.906481,0.467285
500,0.0164,0.483125,0.911403,0.532997


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4163,0.369036,0.903199,0.256043
100,0.2846,0.339725,0.906481,0.299283
150,0.253,0.292244,0.909762,0.331416
200,0.1772,0.373625,0.88105,0.335597
250,0.2161,0.345627,0.908942,0.333999
300,0.1288,0.321814,0.910582,0.38523
350,0.1118,0.389045,0.906481,0.359771
400,0.1384,0.393977,0.915505,0.359787
450,0.0696,0.451807,0.916325,0.376211
500,0.0549,0.400354,0.914684,0.450094


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4163,0.369036,0.903199,0.256043
100,0.2846,0.339725,0.906481,0.299283
150,0.253,0.292244,0.909762,0.331416
200,0.1772,0.373625,0.88105,0.335597
250,0.2161,0.345627,0.908942,0.333999
300,0.1288,0.321814,0.910582,0.38523
350,0.1118,0.389045,0.906481,0.359771
400,0.1384,0.393977,0.915505,0.359787
450,0.0696,0.451807,0.916325,0.376211
500,0.0549,0.400354,0.914684,0.450094


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4163,0.369036,0.903199,0.256043
100,0.2846,0.339725,0.906481,0.299283
150,0.253,0.292244,0.909762,0.331416
200,0.1772,0.373625,0.88105,0.335597
250,0.2161,0.345627,0.908942,0.333999
300,0.1288,0.321814,0.910582,0.38523
350,0.1118,0.389045,0.906481,0.359771
400,0.1384,0.393977,0.915505,0.359787
450,0.0696,0.451807,0.916325,0.376211
500,0.0549,0.400354,0.914684,0.450094


DatasetDict({
    train: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 4872
    })
    test: Dataset({
        features: ['Text', 'label', '__index_level_0__'],
        num_rows: 1219
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4023,0.240447,0.920427,0.358081
100,0.2389,0.237993,0.914684,0.451674
150,0.2108,0.205361,0.930271,0.474673
200,0.123,0.286054,0.92863,0.452998
250,0.0973,0.270726,0.935193,0.491479
300,0.0699,0.358542,0.906481,0.405094
350,0.0327,0.36479,0.924528,0.399376
400,0.0196,0.426639,0.921247,0.501495
450,0.0117,0.466984,0.912223,0.399769
500,0.0075,0.435013,0.92781,0.411738


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4023,0.240447,0.920427,0.358081
100,0.2389,0.237993,0.914684,0.451674
150,0.2108,0.205361,0.930271,0.474673
200,0.123,0.286054,0.92863,0.452998
250,0.0973,0.270726,0.935193,0.491479
300,0.0699,0.358542,0.906481,0.405094
350,0.0327,0.36479,0.924528,0.399376
400,0.0196,0.426639,0.921247,0.501495
450,0.0117,0.466984,0.912223,0.399769
500,0.0075,0.435013,0.92781,0.411738


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4023,0.240447,0.920427,0.358081
100,0.2389,0.237993,0.914684,0.451674
150,0.2108,0.205361,0.930271,0.474673
200,0.123,0.286054,0.92863,0.452998
250,0.0973,0.270726,0.935193,0.491479
300,0.0699,0.358542,0.906481,0.405094
350,0.0327,0.36479,0.924528,0.399376
400,0.0196,0.426639,0.921247,0.501495
450,0.0117,0.466984,0.912223,0.399769
500,0.0075,0.435013,0.92781,0.411738


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3899,0.302656,0.912223,0.298369
100,0.2554,0.302363,0.895816,0.368517
150,0.2117,0.280151,0.923708,0.387648
200,0.1296,0.368995,0.908942,0.396522
250,0.1286,0.358366,0.915505,0.411964
300,0.0861,0.37068,0.915505,0.412768
350,0.0498,0.454879,0.926169,0.411305
400,0.0448,0.42389,0.913864,0.416395
450,0.0237,0.402614,0.920427,0.536192
500,0.0139,0.447574,0.919606,0.404847


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3899,0.302656,0.912223,0.298369
100,0.2554,0.302363,0.895816,0.368517
150,0.2117,0.280151,0.923708,0.387648
200,0.1296,0.368995,0.908942,0.396522
250,0.1286,0.358366,0.915505,0.411964
300,0.0861,0.37068,0.915505,0.412768
350,0.0498,0.454879,0.926169,0.411305
400,0.0448,0.42389,0.913864,0.416395
450,0.0237,0.402614,0.920427,0.536192
500,0.0139,0.447574,0.919606,0.404847


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3899,0.302656,0.912223,0.298369
100,0.2554,0.302363,0.895816,0.368517
150,0.2117,0.280151,0.923708,0.387648
200,0.1296,0.368995,0.908942,0.396522
250,0.1286,0.358366,0.915505,0.411964
300,0.0861,0.37068,0.915505,0.412768
350,0.0498,0.454879,0.926169,0.411305
400,0.0448,0.42389,0.913864,0.416395
450,0.0237,0.402614,0.920427,0.536192
500,0.0139,0.447574,0.919606,0.404847


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3625,0.323426,0.907301,0.272771
100,0.2425,0.313778,0.926989,0.374056
150,0.1991,0.255485,0.912223,0.365764
200,0.1366,0.310749,0.931911,0.424679
250,0.099,0.349998,0.925349,0.410003
300,0.0766,0.311725,0.917145,0.411111
350,0.0406,0.461011,0.921247,0.366165
400,0.032,0.389101,0.931091,0.495605
450,0.0208,0.439088,0.926989,0.411137
500,0.008,0.469679,0.926989,0.467663


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3625,0.323426,0.907301,0.272771
100,0.2425,0.313778,0.926989,0.374056
150,0.1991,0.255485,0.912223,0.365764
200,0.1366,0.310749,0.931911,0.424679
250,0.099,0.349998,0.925349,0.410003
300,0.0766,0.311725,0.917145,0.411111
350,0.0406,0.461011,0.921247,0.366165
400,0.032,0.389101,0.931091,0.495605
450,0.0208,0.439088,0.926989,0.411137
500,0.008,0.469679,0.926989,0.467663


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/4872 [00:00<?, ? examples/s]

Map:   0%|          | 0/1219 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3625,0.323426,0.907301,0.272771
100,0.2425,0.313778,0.926989,0.374056
150,0.1991,0.255485,0.912223,0.365764
200,0.1366,0.310749,0.931911,0.424679
250,0.099,0.349998,0.925349,0.410003
300,0.0766,0.311725,0.917145,0.411111
350,0.0406,0.461011,0.921247,0.366165
400,0.032,0.389101,0.931091,0.495605
450,0.0208,0.439088,0.926989,0.411137
500,0.008,0.469679,0.926989,0.467663


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.920427,0.610428
3,SI2M-Lab/DarijaBERT-arabizi,0.920427,0.536192
6,SI2M-Lab/DarijaBERT-mix,0.911403,0.532997
9,UBC-NLP/MARBERT,0.918786,0.59828
12,UBC-NLP/MARBERTv2,0.910582,0.619596
15,aubmindlab/bert-base-arabertv02-twitter,0.932732,0.460995
16,qarib/bert-base-qarib,0.922888,0.605085
