In [3]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'TCMD_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/Tweet_Classification_Moroccan_Dataset/data.csv', encoding='utf-16', engine='python', sep='\t') #, quotechar="'"  , quoting=3

display(len(df))
      
display(df.columns)
display(df[:4])



c = df['Topic'].value_counts()
display(c)

classes = set(df['Topic'].values)
display(classes)

df['Topic'] = df['Topic'].astype('category')
df['label'] = df['Topic'].cat.codes

df = df[['Tweet', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]


seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['Tweet'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 20
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 25, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 25
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2399

Index(['Tweet', 'Topic'], dtype='object')

Unnamed: 0,Tweet,Topic
0,برا وخيط: أمل بنكيران... مصممة تبتكر الزي المغربي التقليدي بلمسة عالمية,ميديا
1,ربورتاج: قافلة توجيه مُتنقّلة تُطلع تلاميذ العيون على مختلف الآفاق الدراسية,مجتمع
2,ساعة الفطور: طريقة تحضير «وراب» بالخضر وصلصة «تزاتزيكي »,ميديا
3,ربورتاج: مائدة إفطار رمضانية تجمع الديانات الثلاث بالدار البيضاء,ثقافة


Topic
مجتمع     357
رياضة     354
ميديا     353
دولي      348
اقتصاد    344
سياسة     333
ثقافة     310
Name: count, dtype: int64

{'اقتصاد', 'ثقافة', 'دولي', 'رياضة', 'سياسة', 'مجتمع', 'ميديا'}

7

2399

DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.2411,0.657963,0.802083,0.801895
50,0.5115,0.549965,0.814583,0.817531
75,0.316,0.521616,0.84375,0.843381
100,0.2217,0.597004,0.833333,0.833471
125,0.1187,0.543976,0.85625,0.857291
150,0.0748,0.612204,0.85625,0.857858
175,0.0458,0.725318,0.833333,0.83429
200,0.0409,0.702079,0.835417,0.837773
225,0.0229,0.744603,0.833333,0.833642
250,0.0135,0.774035,0.835417,0.837913


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3162,0.731843,0.791667,0.790839
50,0.5233,0.547081,0.8125,0.814717
75,0.3211,0.571492,0.841667,0.840463
100,0.2246,0.585852,0.816667,0.818517
125,0.1207,0.596102,0.835417,0.836069
150,0.0723,0.684178,0.839583,0.840321
175,0.0384,0.779411,0.820833,0.820655
200,0.0315,0.757989,0.839583,0.842168
225,0.0172,0.753498,0.841667,0.841988
250,0.015,0.818561,0.84375,0.845303


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3162,0.731843,0.791667,0.790839
50,0.5233,0.547081,0.8125,0.814717
75,0.3211,0.571492,0.841667,0.840463
100,0.2246,0.585852,0.816667,0.818517
125,0.1207,0.596102,0.835417,0.836069
150,0.0723,0.684178,0.839583,0.840321
175,0.0384,0.779411,0.820833,0.820655
200,0.0315,0.757989,0.839583,0.842168
225,0.0172,0.753498,0.841667,0.841988
250,0.015,0.818561,0.84375,0.845303


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.311,0.669919,0.7875,0.782775
50,0.5651,0.535789,0.829167,0.829369
75,0.2958,0.544734,0.825,0.827628
100,0.2092,0.572566,0.841667,0.84294
125,0.1136,0.597357,0.847917,0.848315
150,0.0764,0.651253,0.847917,0.846709
175,0.0413,0.775223,0.833333,0.833374
200,0.0252,0.844808,0.8375,0.837367
225,0.0228,0.859501,0.835417,0.834547
250,0.0226,0.886217,0.839583,0.838067


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.311,0.669919,0.7875,0.782775
50,0.5651,0.535789,0.829167,0.829369
75,0.2958,0.544734,0.825,0.827628
100,0.2092,0.572566,0.841667,0.84294
125,0.1136,0.597357,0.847917,0.848315
150,0.0764,0.651253,0.847917,0.846709
175,0.0413,0.775223,0.833333,0.833374
200,0.0252,0.844808,0.8375,0.837367
225,0.0228,0.859501,0.835417,0.834547
250,0.0226,0.886217,0.839583,0.838067


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.311,0.669919,0.7875,0.782775
50,0.5651,0.535789,0.829167,0.829369
75,0.2958,0.544734,0.825,0.827628
100,0.2092,0.572566,0.841667,0.84294
125,0.1136,0.597357,0.847917,0.848315
150,0.0764,0.651253,0.847917,0.846709
175,0.0413,0.775223,0.833333,0.833374
200,0.0252,0.844808,0.8375,0.837367
225,0.0228,0.859501,0.835417,0.834547
250,0.0226,0.886217,0.839583,0.838067


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.2881,0.690935,0.7875,0.782633
50,0.5045,0.623803,0.791667,0.794371
75,0.3289,0.548177,0.827083,0.831467
100,0.1796,0.643679,0.81875,0.823773
125,0.1247,0.659277,0.80625,0.809136
150,0.0828,0.685355,0.827083,0.831275
175,0.0437,0.764454,0.829167,0.832368
200,0.056,0.822362,0.822917,0.82698
225,0.0148,0.8408,0.820833,0.826082
250,0.0184,0.867567,0.81875,0.822062


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.2881,0.690935,0.7875,0.782633
50,0.5045,0.623803,0.791667,0.794371
75,0.3289,0.548177,0.827083,0.831467
100,0.1796,0.643679,0.81875,0.823773
125,0.1247,0.659277,0.80625,0.809136
150,0.0828,0.685355,0.827083,0.831275
175,0.0437,0.764454,0.829167,0.832368
200,0.056,0.822362,0.822917,0.82698
225,0.0148,0.8408,0.820833,0.826082
250,0.0184,0.867567,0.81875,0.822062


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.2881,0.690935,0.7875,0.782633
50,0.5045,0.623803,0.791667,0.794371
75,0.3289,0.548177,0.827083,0.831467
100,0.1796,0.643679,0.81875,0.823773
125,0.1247,0.659277,0.80625,0.809136
150,0.0828,0.685355,0.827083,0.831275
175,0.0437,0.764454,0.829167,0.832368
200,0.056,0.822362,0.822917,0.82698
225,0.0148,0.8408,0.820833,0.826082
250,0.0184,0.867567,0.81875,0.822062


DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5475,1.059691,0.683333,0.684825
50,0.8043,0.794526,0.754167,0.755147
75,0.4529,0.741963,0.779167,0.779093
100,0.2516,0.73868,0.785417,0.787276
125,0.1381,0.880945,0.770833,0.77192
150,0.0924,0.895591,0.7875,0.789274
175,0.0382,1.043122,0.783333,0.784707
200,0.0396,1.043337,0.79375,0.795601
225,0.02,1.171835,0.770833,0.77154
250,0.0222,1.178952,0.775,0.778402


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5475,1.059691,0.683333,0.684825
50,0.8043,0.794526,0.754167,0.755147
75,0.4529,0.741963,0.779167,0.779093
100,0.2516,0.73868,0.785417,0.787276
125,0.1381,0.880945,0.770833,0.77192
150,0.0924,0.895591,0.7875,0.789274
175,0.0382,1.043122,0.783333,0.784707
200,0.0396,1.043337,0.79375,0.795601
225,0.02,1.171835,0.770833,0.77154
250,0.0222,1.178952,0.775,0.778402


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5475,1.059691,0.683333,0.684825
50,0.8043,0.794526,0.754167,0.755147
75,0.4529,0.741963,0.779167,0.779093
100,0.2516,0.73868,0.785417,0.787276
125,0.1381,0.880945,0.770833,0.77192
150,0.0924,0.895591,0.7875,0.789274
175,0.0382,1.043122,0.783333,0.784707
200,0.0396,1.043337,0.79375,0.795601
225,0.02,1.171835,0.770833,0.77154
250,0.0222,1.178952,0.775,0.778402


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5914,1.07346,0.6625,0.659293
50,0.8078,0.789215,0.727083,0.723187
75,0.4309,0.761516,0.760417,0.759107
100,0.2444,0.840997,0.754167,0.756269
125,0.1034,0.982328,0.75,0.748768
150,0.0802,0.96071,0.766667,0.766076
175,0.0351,1.161786,0.74375,0.740978
200,0.025,1.157146,0.772917,0.771053
225,0.0202,1.228702,0.7625,0.761745
250,0.0261,1.211015,0.777083,0.776878


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5914,1.07346,0.6625,0.659293
50,0.8078,0.789215,0.727083,0.723187
75,0.4309,0.761516,0.760417,0.759107
100,0.2444,0.840997,0.754167,0.756269
125,0.1034,0.982328,0.75,0.748768
150,0.0802,0.96071,0.766667,0.766076
175,0.0351,1.161786,0.74375,0.740978
200,0.025,1.157146,0.772917,0.771053
225,0.0202,1.228702,0.7625,0.761745
250,0.0261,1.211015,0.777083,0.776878


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5914,1.07346,0.6625,0.659293
50,0.8078,0.789215,0.727083,0.723187
75,0.4309,0.761516,0.760417,0.759107
100,0.2444,0.840997,0.754167,0.756269
125,0.1034,0.982328,0.75,0.748768
150,0.0802,0.96071,0.766667,0.766076
175,0.0351,1.161786,0.74375,0.740978
200,0.025,1.157146,0.772917,0.771053
225,0.0202,1.228702,0.7625,0.761745
250,0.0261,1.211015,0.777083,0.776878


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5566,1.148369,0.635417,0.639082
50,0.8078,0.89048,0.702083,0.705445
75,0.4618,0.854254,0.735417,0.739137
100,0.2624,0.861281,0.754167,0.75638
125,0.1269,1.026515,0.75,0.754616
150,0.0877,1.133947,0.739583,0.732864
175,0.0382,1.249345,0.725,0.72908
200,0.0442,1.499887,0.714583,0.71852
225,0.0217,1.458039,0.71875,0.722241
250,0.0258,1.451469,0.729167,0.730696


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5566,1.148369,0.635417,0.639082
50,0.8078,0.89048,0.702083,0.705445
75,0.4618,0.854254,0.735417,0.739137
100,0.2624,0.861281,0.754167,0.75638
125,0.1269,1.026515,0.75,0.754616
150,0.0877,1.133947,0.739583,0.732864
175,0.0382,1.249345,0.725,0.72908
200,0.0442,1.499887,0.714583,0.71852
225,0.0217,1.458039,0.71875,0.722241
250,0.0258,1.451469,0.729167,0.730696


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5566,1.148369,0.635417,0.639082
50,0.8078,0.89048,0.702083,0.705445
75,0.4618,0.854254,0.735417,0.739137
100,0.2624,0.861281,0.754167,0.75638
125,0.1269,1.026515,0.75,0.754616
150,0.0877,1.133947,0.739583,0.732864
175,0.0382,1.249345,0.725,0.72908
200,0.0442,1.499887,0.714583,0.71852
225,0.0217,1.458039,0.71875,0.722241
250,0.0258,1.451469,0.729167,0.730696


DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.302,0.763501,0.745833,0.745107
50,0.4646,0.641744,0.816667,0.818601
75,0.2951,0.660772,0.814583,0.813862
100,0.1743,0.622649,0.827083,0.827188
125,0.0985,0.73995,0.814583,0.8158
150,0.0784,0.795366,0.822917,0.82418
175,0.0332,0.914769,0.816667,0.820845
200,0.0452,0.961504,0.814583,0.816798
225,0.0274,0.894179,0.822917,0.823695
250,0.0124,0.985537,0.820833,0.821516


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.302,0.763501,0.745833,0.745107
50,0.4646,0.641744,0.816667,0.818601
75,0.2951,0.660772,0.814583,0.813862
100,0.1743,0.622649,0.827083,0.827188
125,0.0985,0.73995,0.814583,0.8158
150,0.0784,0.795366,0.822917,0.82418
175,0.0332,0.914769,0.816667,0.820845
200,0.0452,0.961504,0.814583,0.816798
225,0.0274,0.894179,0.822917,0.823695
250,0.0124,0.985537,0.820833,0.821516


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.302,0.763501,0.745833,0.745107
50,0.4646,0.641744,0.816667,0.818601
75,0.2951,0.660772,0.814583,0.813862
100,0.1743,0.622649,0.827083,0.827188
125,0.0985,0.73995,0.814583,0.8158
150,0.0784,0.795366,0.822917,0.82418
175,0.0332,0.914769,0.816667,0.820845
200,0.0452,0.961504,0.814583,0.816798
225,0.0274,0.894179,0.822917,0.823695
250,0.0124,0.985537,0.820833,0.821516


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3542,0.741602,0.766667,0.761156
50,0.5416,0.525058,0.839583,0.839394
75,0.285,0.579937,0.845833,0.845078
100,0.1801,0.643726,0.820833,0.82072
125,0.0952,0.770127,0.825,0.825198
150,0.0587,0.757152,0.835417,0.832564
175,0.0308,0.955276,0.829167,0.826066
200,0.0299,0.996025,0.816667,0.812328
225,0.0229,1.013592,0.829167,0.827536
250,0.0146,0.993801,0.833333,0.832303


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3542,0.741602,0.766667,0.761156
50,0.5416,0.525058,0.839583,0.839394
75,0.285,0.579937,0.845833,0.845078
100,0.1801,0.643726,0.820833,0.82072
125,0.0952,0.770127,0.825,0.825198
150,0.0587,0.757152,0.835417,0.832564
175,0.0308,0.955276,0.829167,0.826066
200,0.0299,0.996025,0.816667,0.812328
225,0.0229,1.013592,0.829167,0.827536
250,0.0146,0.993801,0.833333,0.832303


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3542,0.741602,0.766667,0.761156
50,0.5416,0.525058,0.839583,0.839394
75,0.285,0.579937,0.845833,0.845078
100,0.1801,0.643726,0.820833,0.82072
125,0.0952,0.770127,0.825,0.825198
150,0.0587,0.757152,0.835417,0.832564
175,0.0308,0.955276,0.829167,0.826066
200,0.0299,0.996025,0.816667,0.812328
225,0.0229,1.013592,0.829167,0.827536
250,0.0146,0.993801,0.833333,0.832303


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.283,0.715174,0.791667,0.788074
50,0.4856,0.606021,0.81875,0.82063
75,0.2675,0.684091,0.791667,0.7967
100,0.1499,0.791596,0.791667,0.793687
125,0.1065,0.77487,0.820833,0.823555
150,0.071,0.871292,0.816667,0.818989
175,0.0423,0.84928,0.808333,0.812062
200,0.0279,0.937316,0.804167,0.80585
225,0.0127,1.021281,0.804167,0.811333
250,0.0201,1.013876,0.827083,0.832094


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.283,0.715174,0.791667,0.788074
50,0.4856,0.606021,0.81875,0.82063
75,0.2675,0.684091,0.791667,0.7967
100,0.1499,0.791596,0.791667,0.793687
125,0.1065,0.77487,0.820833,0.823555
150,0.071,0.871292,0.816667,0.818989
175,0.0423,0.84928,0.808333,0.812062
200,0.0279,0.937316,0.804167,0.80585
225,0.0127,1.021281,0.804167,0.811333
250,0.0201,1.013876,0.827083,0.832094


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.283,0.715174,0.791667,0.788074
50,0.4856,0.606021,0.81875,0.82063
75,0.2675,0.684091,0.791667,0.7967
100,0.1499,0.791596,0.791667,0.793687
125,0.1065,0.77487,0.820833,0.823555
150,0.071,0.871292,0.816667,0.818989
175,0.0423,0.84928,0.808333,0.812062
200,0.0279,0.937316,0.804167,0.80585
225,0.0127,1.021281,0.804167,0.811333
250,0.0201,1.013876,0.827083,0.832094


DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3785,0.810909,0.772917,0.77515
50,0.5513,0.614073,0.8125,0.814386
75,0.3632,0.605358,0.808333,0.80934
100,0.2374,0.688074,0.8125,0.81271
125,0.1523,0.724123,0.810417,0.814803
150,0.1033,0.85267,0.810417,0.809322
175,0.075,0.823568,0.814583,0.815132
200,0.044,0.930853,0.804167,0.804091
225,0.051,1.082822,0.804167,0.801656
250,0.0454,0.997828,0.814583,0.815127


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3785,0.810909,0.772917,0.77515
50,0.5513,0.614073,0.8125,0.814386
75,0.3632,0.605358,0.808333,0.80934
100,0.2374,0.688074,0.8125,0.81271
125,0.1523,0.724123,0.810417,0.814803
150,0.1033,0.85267,0.810417,0.809322
175,0.075,0.823568,0.814583,0.815132
200,0.044,0.930853,0.804167,0.804091
225,0.051,1.082822,0.804167,0.801656
250,0.0454,0.997828,0.814583,0.815127


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3785,0.810909,0.772917,0.77515
50,0.5513,0.614073,0.8125,0.814386
75,0.3632,0.605358,0.808333,0.80934
100,0.2374,0.688074,0.8125,0.81271
125,0.1523,0.724123,0.810417,0.814803
150,0.1033,0.85267,0.810417,0.809322
175,0.075,0.823568,0.814583,0.815132
200,0.044,0.930853,0.804167,0.804091
225,0.051,1.082822,0.804167,0.801656
250,0.0454,0.997828,0.814583,0.815127


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3547,0.761781,0.7875,0.786222
50,0.6102,0.563098,0.81875,0.81451
75,0.3472,0.623541,0.81875,0.819564
100,0.2316,0.728653,0.795833,0.79533
125,0.1644,0.695758,0.822917,0.821789
150,0.0879,0.767208,0.81875,0.815998
175,0.0736,0.815761,0.833333,0.833643
200,0.0472,0.920883,0.822917,0.820094
225,0.0319,0.977591,0.820833,0.818849
250,0.0386,1.12415,0.802083,0.799895


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3547,0.761781,0.7875,0.786222
50,0.6102,0.563098,0.81875,0.81451
75,0.3472,0.623541,0.81875,0.819564
100,0.2316,0.728653,0.795833,0.79533
125,0.1644,0.695758,0.822917,0.821789
150,0.0879,0.767208,0.81875,0.815998
175,0.0736,0.815761,0.833333,0.833643
200,0.0472,0.920883,0.822917,0.820094
225,0.0319,0.977591,0.820833,0.818849
250,0.0386,1.12415,0.802083,0.799895


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3547,0.761781,0.7875,0.786222
50,0.6102,0.563098,0.81875,0.81451
75,0.3472,0.623541,0.81875,0.819564
100,0.2316,0.728653,0.795833,0.79533
125,0.1644,0.695758,0.822917,0.821789
150,0.0879,0.767208,0.81875,0.815998
175,0.0736,0.815761,0.833333,0.833643
200,0.0472,0.920883,0.822917,0.820094
225,0.0319,0.977591,0.820833,0.818849
250,0.0386,1.12415,0.802083,0.799895


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3474,0.857503,0.775,0.771378
50,0.5649,0.601721,0.829167,0.830792
75,0.3178,0.73001,0.785417,0.790986
100,0.1854,0.798911,0.789583,0.790641
125,0.1475,0.795134,0.81875,0.817345
150,0.0949,0.821347,0.797917,0.802724
175,0.0566,0.916495,0.797917,0.80251
200,0.0652,0.922385,0.8125,0.818351
225,0.0228,0.986391,0.814583,0.816026
250,0.0396,1.172724,0.789583,0.79371


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3474,0.857503,0.775,0.771378
50,0.5649,0.601721,0.829167,0.830792
75,0.3178,0.73001,0.785417,0.790986
100,0.1854,0.798911,0.789583,0.790641
125,0.1475,0.795134,0.81875,0.817345
150,0.0949,0.821347,0.797917,0.802724
175,0.0566,0.916495,0.797917,0.80251
200,0.0652,0.922385,0.8125,0.818351
225,0.0228,0.986391,0.814583,0.816026
250,0.0396,1.172724,0.789583,0.79371


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.3474,0.857503,0.775,0.771378
50,0.5649,0.601721,0.829167,0.830792
75,0.3178,0.73001,0.785417,0.790986
100,0.1854,0.798911,0.789583,0.790641
125,0.1475,0.795134,0.81875,0.817345
150,0.0949,0.821347,0.797917,0.802724
175,0.0566,0.916495,0.797917,0.80251
200,0.0652,0.922385,0.8125,0.818351
225,0.0228,0.986391,0.814583,0.816026
250,0.0396,1.172724,0.789583,0.79371


DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5573,1.069026,0.716667,0.714868
50,0.8084,0.671593,0.80625,0.807929
75,0.4747,0.578326,0.841667,0.843383
100,0.303,0.639903,0.822917,0.820834
125,0.1913,0.606658,0.835417,0.836441
150,0.1406,0.727294,0.810417,0.811804
175,0.1243,0.73434,0.814583,0.818045
200,0.0716,0.761079,0.833333,0.838435
225,0.0652,0.801618,0.81875,0.819025
250,0.0463,0.741482,0.83125,0.833056


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5573,1.069026,0.716667,0.714868
50,0.8084,0.671593,0.80625,0.807929
75,0.4747,0.578326,0.841667,0.843383
100,0.303,0.639903,0.822917,0.820834
125,0.1913,0.606658,0.835417,0.836441
150,0.1406,0.727294,0.810417,0.811804
175,0.1243,0.73434,0.814583,0.818045
200,0.0716,0.761079,0.833333,0.838435
225,0.0652,0.801618,0.81875,0.819025
250,0.0463,0.741482,0.83125,0.833056


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5573,1.069026,0.716667,0.714868
50,0.8084,0.671593,0.80625,0.807929
75,0.4747,0.578326,0.841667,0.843383
100,0.303,0.639903,0.822917,0.820834
125,0.1913,0.606658,0.835417,0.836441
150,0.1406,0.727294,0.810417,0.811804
175,0.1243,0.73434,0.814583,0.818045
200,0.0716,0.761079,0.833333,0.838435
225,0.0652,0.801618,0.81875,0.819025
250,0.0463,0.741482,0.83125,0.833056


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5712,1.017526,0.775,0.774687
50,0.8233,0.600525,0.835417,0.833411
75,0.4589,0.527399,0.85,0.849732
100,0.308,0.519288,0.839583,0.837412
125,0.2226,0.573526,0.822917,0.819063
150,0.1478,0.641697,0.8375,0.833995
175,0.1056,0.644598,0.845833,0.841539
200,0.0705,0.717488,0.841667,0.840085
225,0.0698,0.705423,0.84375,0.841337
250,0.0585,0.822983,0.820833,0.82059


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5712,1.017526,0.775,0.774687
50,0.8233,0.600525,0.835417,0.833411
75,0.4589,0.527399,0.85,0.849732
100,0.308,0.519288,0.839583,0.837412
125,0.2226,0.573526,0.822917,0.819063
150,0.1478,0.641697,0.8375,0.833995
175,0.1056,0.644598,0.845833,0.841539
200,0.0705,0.717488,0.841667,0.840085
225,0.0698,0.705423,0.84375,0.841337
250,0.0585,0.822983,0.820833,0.82059


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5712,1.017526,0.775,0.774687
50,0.8233,0.600525,0.835417,0.833411
75,0.4589,0.527399,0.85,0.849732
100,0.308,0.519288,0.839583,0.837412
125,0.2226,0.573526,0.822917,0.819063
150,0.1478,0.641697,0.8375,0.833995
175,0.1056,0.644598,0.845833,0.841539
200,0.0705,0.717488,0.841667,0.840085
225,0.0698,0.705423,0.84375,0.841337
250,0.0585,0.822983,0.820833,0.82059


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5556,1.009697,0.7875,0.780908
50,0.791,0.640468,0.835417,0.836975
75,0.464,0.637217,0.808333,0.811419
100,0.2698,0.602581,0.810417,0.812927
125,0.2235,0.599281,0.839583,0.843462
150,0.1394,0.703063,0.808333,0.814431
175,0.0899,0.749129,0.810417,0.819433
200,0.0977,0.728949,0.814583,0.818019
225,0.0587,0.809746,0.81875,0.821298
250,0.0639,0.942991,0.789583,0.794688


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5556,1.009697,0.7875,0.780908
50,0.791,0.640468,0.835417,0.836975
75,0.464,0.637217,0.808333,0.811419
100,0.2698,0.602581,0.810417,0.812927
125,0.2235,0.599281,0.839583,0.843462
150,0.1394,0.703063,0.808333,0.814431
175,0.0899,0.749129,0.810417,0.819433
200,0.0977,0.728949,0.814583,0.818019
225,0.0587,0.809746,0.81875,0.821298
250,0.0639,0.942991,0.789583,0.794688


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.5556,1.009697,0.7875,0.780908
50,0.791,0.640468,0.835417,0.836975
75,0.464,0.637217,0.808333,0.811419
100,0.2698,0.602581,0.810417,0.812927
125,0.2235,0.599281,0.839583,0.843462
150,0.1394,0.703063,0.808333,0.814431
175,0.0899,0.749129,0.810417,0.819433
200,0.0977,0.728949,0.814583,0.818019
225,0.0587,0.809746,0.81875,0.821298
250,0.0639,0.942991,0.789583,0.794688


DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7687,1.439387,0.525,0.53154
50,1.2867,1.116004,0.63125,0.630572
75,0.9348,0.885442,0.679167,0.686474
100,0.6437,0.748766,0.74375,0.746026
125,0.4475,0.728863,0.7625,0.764293
150,0.2799,0.842925,0.7625,0.760038
175,0.1584,0.776,0.777083,0.778279
200,0.0801,0.801966,0.795833,0.79648
225,0.0589,0.963952,0.758333,0.754729
250,0.0294,0.971395,0.78125,0.782729


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7687,1.439387,0.525,0.53154
50,1.2867,1.116004,0.63125,0.630572
75,0.9348,0.885442,0.679167,0.686474
100,0.6437,0.748766,0.74375,0.746026
125,0.4475,0.728863,0.7625,0.764293
150,0.2799,0.842925,0.7625,0.760038
175,0.1584,0.776,0.777083,0.778279
200,0.0801,0.801966,0.795833,0.79648
225,0.0589,0.963952,0.758333,0.754729
250,0.0294,0.971395,0.78125,0.782729


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7687,1.439387,0.525,0.53154
50,1.2867,1.116004,0.63125,0.630572
75,0.9348,0.885442,0.679167,0.686474
100,0.6437,0.748766,0.74375,0.746026
125,0.4475,0.728863,0.7625,0.764293
150,0.2799,0.842925,0.7625,0.760038
175,0.1584,0.776,0.777083,0.778279
200,0.0801,0.801966,0.795833,0.79648
225,0.0589,0.963952,0.758333,0.754729
250,0.0294,0.971395,0.78125,0.782729


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.778,1.375164,0.570833,0.567539
50,1.268,1.033334,0.660417,0.657976
75,0.8452,0.824576,0.71875,0.714562
100,0.6081,0.794426,0.716667,0.703747
125,0.4078,0.750581,0.747917,0.745611
150,0.2505,0.802122,0.758333,0.756545
175,0.1396,0.841865,0.775,0.769873
200,0.0812,0.869589,0.777083,0.77442
225,0.0482,0.987518,0.78125,0.780261
250,0.0476,1.066905,0.772917,0.771292


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.778,1.375164,0.570833,0.567539
50,1.268,1.033334,0.660417,0.657976
75,0.8452,0.824576,0.71875,0.714562
100,0.6081,0.794426,0.716667,0.703747
125,0.4078,0.750581,0.747917,0.745611
150,0.2505,0.802122,0.758333,0.756545
175,0.1396,0.841865,0.775,0.769873
200,0.0812,0.869589,0.777083,0.77442
225,0.0482,0.987518,0.78125,0.780261
250,0.0476,1.066905,0.772917,0.771292


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.778,1.375164,0.570833,0.567539
50,1.268,1.033334,0.660417,0.657976
75,0.8452,0.824576,0.71875,0.714562
100,0.6081,0.794426,0.716667,0.703747
125,0.4078,0.750581,0.747917,0.745611
150,0.2505,0.802122,0.758333,0.756545
175,0.1396,0.841865,0.775,0.769873
200,0.0812,0.869589,0.777083,0.77442
225,0.0482,0.987518,0.78125,0.780261
250,0.0476,1.066905,0.772917,0.771292


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.8409,1.641297,0.43125,0.429309
50,1.3994,1.141994,0.60625,0.600146
75,0.9592,1.069258,0.604167,0.605025
100,0.6647,0.853747,0.71875,0.718554
125,0.4443,0.87496,0.722917,0.723177
150,0.3019,0.832358,0.741667,0.746914
175,0.1748,0.849019,0.75625,0.759107
200,0.1327,0.94962,0.739583,0.745485
225,0.0726,0.971381,0.7625,0.765533
250,0.0509,1.148705,0.745833,0.749333


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.8409,1.641297,0.43125,0.429309
50,1.3994,1.141994,0.60625,0.600146
75,0.9592,1.069258,0.604167,0.605025
100,0.6647,0.853747,0.71875,0.718554
125,0.4443,0.87496,0.722917,0.723177
150,0.3019,0.832358,0.741667,0.746914
175,0.1748,0.849019,0.75625,0.759107
200,0.1327,0.94962,0.739583,0.745485
225,0.0726,0.971381,0.7625,0.765533
250,0.0509,1.148705,0.745833,0.749333


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.8409,1.641297,0.43125,0.429309
50,1.3994,1.141994,0.60625,0.600146
75,0.9592,1.069258,0.604167,0.605025
100,0.6647,0.853747,0.71875,0.718554
125,0.4443,0.87496,0.722917,0.723177
150,0.3019,0.832358,0.741667,0.746914
175,0.1748,0.849019,0.75625,0.759107
200,0.1327,0.94962,0.739583,0.745485
225,0.0726,0.971381,0.7625,0.765533
250,0.0509,1.148705,0.745833,0.749333


DatasetDict({
    train: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 1919
    })
    test: Dataset({
        features: ['Tweet', 'label'],
        num_rows: 480
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7652,1.409523,0.510417,0.493054
50,1.1566,1.030456,0.6375,0.639593
75,0.7551,0.976776,0.6625,0.656013
100,0.4933,0.958737,0.6875,0.686214
125,0.2945,0.912092,0.71875,0.719392
150,0.1558,1.052582,0.702083,0.698381
175,0.093,1.085981,0.7125,0.707756
200,0.0562,1.134325,0.716667,0.716058
225,0.0338,1.172425,0.71875,0.715945
250,0.0187,1.346207,0.722917,0.723141


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7652,1.409523,0.510417,0.493054
50,1.1566,1.030456,0.6375,0.639593
75,0.7551,0.976776,0.6625,0.656013
100,0.4933,0.958737,0.6875,0.686214
125,0.2945,0.912092,0.71875,0.719392
150,0.1558,1.052582,0.702083,0.698381
175,0.093,1.085981,0.7125,0.707756
200,0.0562,1.134325,0.716667,0.716058
225,0.0338,1.172425,0.71875,0.715945
250,0.0187,1.346207,0.722917,0.723141


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7652,1.409523,0.510417,0.493054
50,1.1566,1.030456,0.6375,0.639593
75,0.7551,0.976776,0.6625,0.656013
100,0.4933,0.958737,0.6875,0.686214
125,0.2945,0.912092,0.71875,0.719392
150,0.1558,1.052582,0.702083,0.698381
175,0.093,1.085981,0.7125,0.707756
200,0.0562,1.134325,0.716667,0.716058
225,0.0338,1.172425,0.71875,0.715945
250,0.0187,1.346207,0.722917,0.723141


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.798,1.41992,0.50625,0.474965
50,1.2563,1.005754,0.660417,0.658458
75,0.7947,0.884983,0.685417,0.684102
100,0.5554,0.873422,0.710417,0.702883
125,0.3292,0.863639,0.729167,0.721831
150,0.1619,0.958422,0.7,0.700387
175,0.0746,1.001179,0.722917,0.716902
200,0.0545,1.102071,0.702083,0.700011
225,0.0335,1.200048,0.720833,0.718589
250,0.0214,1.28813,0.73125,0.728034


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.798,1.41992,0.50625,0.474965
50,1.2563,1.005754,0.660417,0.658458
75,0.7947,0.884983,0.685417,0.684102
100,0.5554,0.873422,0.710417,0.702883
125,0.3292,0.863639,0.729167,0.721831
150,0.1619,0.958422,0.7,0.700387
175,0.0746,1.001179,0.722917,0.716902
200,0.0545,1.102071,0.702083,0.700011
225,0.0335,1.200048,0.720833,0.718589
250,0.0214,1.28813,0.73125,0.728034


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.798,1.41992,0.50625,0.474965
50,1.2563,1.005754,0.660417,0.658458
75,0.7947,0.884983,0.685417,0.684102
100,0.5554,0.873422,0.710417,0.702883
125,0.3292,0.863639,0.729167,0.721831
150,0.1619,0.958422,0.7,0.700387
175,0.0746,1.001179,0.722917,0.716902
200,0.0545,1.102071,0.702083,0.700011
225,0.0335,1.200048,0.720833,0.718589
250,0.0214,1.28813,0.73125,0.728034


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7507,1.464526,0.485417,0.487555
50,1.1762,1.116076,0.602083,0.60411
75,0.7566,1.165259,0.602083,0.603397
100,0.4703,1.045791,0.677083,0.677819
125,0.2777,1.097797,0.677083,0.680107
150,0.1474,1.160033,0.683333,0.688896
175,0.0807,1.406651,0.664583,0.663667
200,0.071,1.386584,0.69375,0.697555
225,0.0321,1.411193,0.697917,0.702075
250,0.0294,1.50306,0.691667,0.693671


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7507,1.464526,0.485417,0.487555
50,1.1762,1.116076,0.602083,0.60411
75,0.7566,1.165259,0.602083,0.603397
100,0.4703,1.045791,0.677083,0.677819
125,0.2777,1.097797,0.677083,0.680107
150,0.1474,1.160033,0.683333,0.688896
175,0.0807,1.406651,0.664583,0.663667
200,0.071,1.386584,0.69375,0.697555
225,0.0321,1.411193,0.697917,0.702075
250,0.0294,1.50306,0.691667,0.693671


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1919 [00:00<?, ? examples/s]

Map:   0%|          | 0/480 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,1.7507,1.464526,0.485417,0.487555
50,1.1762,1.116076,0.602083,0.60411
75,0.7566,1.165259,0.602083,0.603397
100,0.4703,1.045791,0.677083,0.677819
125,0.2777,1.097797,0.677083,0.680107
150,0.1474,1.160033,0.683333,0.688896
175,0.0807,1.406651,0.664583,0.663667
200,0.071,1.386584,0.69375,0.697555
225,0.0321,1.411193,0.697917,0.702075
250,0.0294,1.50306,0.691667,0.693671


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.795833,0.795777
3,SI2M-Lab/DarijaBERT-arabizi,0.754167,0.756526
6,SI2M-Lab/DarijaBERT-mix,0.797917,0.79682
12,UBC-NLP/MARBERT,0.833333,0.833643
15,UBC-NLP/MARBERTv2,0.85,0.849732
18,aubmindlab/bert-base-arabertv02-twitter,0.85625,0.857858
19,qarib/bert-base-qarib,0.845833,0.845078
