In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'MTCD_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/MTCD.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3


      
display(df.columns)
display(df[:4])



classes = set(df['labels'].values)
display(classes)

df['labels'] = df['labels'].astype('category')
df['label'] = df['labels'].cat.codes

df = df[['text', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


max_sequence_length = 128


models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]




seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 8
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 200, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 200
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-17 22:41:16.367956: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-17 22:41:16.390862: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['text', 'labels'], dtype='object')

Unnamed: 0,text,labels
0,خويا نصيحة مني. كمل فخدمتك ومتديهاش فكلام ناس داك لقاليك نقاشة ولانگافة. اتلقا ختو لكتصرف عليه.,News
1,ضربناكم كاملين ١😂🖕🇲🇦🇲🇦🇲🇦🇲🇦,Sport
2,بغيت نشارك فشي مسابقة حيت عندي 90 فتخفيض,Gaming
3,چاتني 92ف10,Gaming


{'Gaming', 'Kitchen', 'News', 'Sport'}

4

64222

DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5088,0.397281,0.857844,0.859287
400,0.3662,0.31629,0.883924,0.885853
600,0.3319,0.311246,0.883612,0.885666
800,0.3035,0.328268,0.880187,0.884813
1000,0.2134,0.306379,0.89817,0.899401
1200,0.2041,0.296843,0.894901,0.896389
1400,0.1818,0.30963,0.900662,0.901699
1600,0.1882,0.261263,0.907668,0.909109
1800,0.1104,0.372319,0.899805,0.901966
2000,0.1275,0.327782,0.90253,0.904085


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5315,0.410835,0.851304,0.854925
400,0.3704,0.332751,0.87536,0.876375
600,0.3297,0.317232,0.883457,0.885698
800,0.3054,0.320138,0.886181,0.889704
1000,0.2169,0.30416,0.899494,0.901151
1200,0.2038,0.294626,0.895134,0.896759
1400,0.1816,0.308425,0.897781,0.897338
1600,0.188,0.274121,0.905333,0.906608
1800,0.111,0.330861,0.904243,0.905455
2000,0.1295,0.312639,0.902842,0.903988


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5315,0.410835,0.851304,0.854925
400,0.3704,0.332751,0.87536,0.876375
600,0.3297,0.317232,0.883457,0.885698
800,0.3054,0.320138,0.886181,0.889704
1000,0.2169,0.30416,0.899494,0.901151
1200,0.2038,0.294626,0.895134,0.896759
1400,0.1816,0.308425,0.897781,0.897338
1600,0.188,0.274121,0.905333,0.906608
1800,0.111,0.330861,0.904243,0.905455
2000,0.1295,0.312639,0.902842,0.903988


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5369,0.361593,0.867108,0.869392
400,0.3715,0.347334,0.875749,0.876325
600,0.3336,0.29548,0.88875,0.891671
800,0.3086,0.270039,0.90144,0.902977
1000,0.2043,0.292789,0.893266,0.89542
1200,0.1982,0.281165,0.904399,0.904904
1400,0.205,0.295769,0.905956,0.907819
1600,0.1988,0.279015,0.907824,0.908234
1800,0.1131,0.313995,0.904476,0.905347
2000,0.122,0.301613,0.910549,0.911261


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5369,0.361593,0.867108,0.869392
400,0.3715,0.347334,0.875749,0.876325
600,0.3336,0.29548,0.88875,0.891671
800,0.3086,0.270039,0.90144,0.902977
1000,0.2043,0.292789,0.893266,0.89542
1200,0.1982,0.281165,0.904399,0.904904
1400,0.205,0.295769,0.905956,0.907819
1600,0.1988,0.279015,0.907824,0.908234
1800,0.1131,0.313995,0.904476,0.905347
2000,0.122,0.301613,0.910549,0.911261


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5369,0.361593,0.867108,0.869392
400,0.3715,0.347334,0.875749,0.876325
600,0.3336,0.29548,0.88875,0.891671
800,0.3086,0.270039,0.90144,0.902977
1000,0.2043,0.292789,0.893266,0.89542
1200,0.1982,0.281165,0.904399,0.904904
1400,0.205,0.295769,0.905956,0.907819
1600,0.1988,0.279015,0.907824,0.908234
1800,0.1131,0.313995,0.904476,0.905347
2000,0.122,0.301613,0.910549,0.911261


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5294,0.39321,0.856286,0.856592
400,0.3786,0.334886,0.878786,0.878588
600,0.3252,0.300385,0.889996,0.891275
800,0.304,0.284946,0.896069,0.897791
1000,0.2122,0.295275,0.899728,0.900719
1200,0.1946,0.297144,0.899572,0.900627
1400,0.1984,0.296427,0.898871,0.900163
1600,0.1963,0.274463,0.908058,0.908774
1800,0.1199,0.324276,0.906578,0.907588
2000,0.1173,0.330055,0.905099,0.904961


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5294,0.39321,0.856286,0.856592
400,0.3786,0.334886,0.878786,0.878588
600,0.3252,0.300385,0.889996,0.891275
800,0.304,0.284946,0.896069,0.897791
1000,0.2122,0.295275,0.899728,0.900719
1200,0.1946,0.297144,0.899572,0.900627
1400,0.1984,0.296427,0.898871,0.900163
1600,0.1963,0.274463,0.908058,0.908774
1800,0.1199,0.324276,0.906578,0.907588
2000,0.1173,0.330055,0.905099,0.904961


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5294,0.39321,0.856286,0.856592
400,0.3786,0.334886,0.878786,0.878588
600,0.3252,0.300385,0.889996,0.891275
800,0.304,0.284946,0.896069,0.897791
1000,0.2122,0.295275,0.899728,0.900719
1200,0.1946,0.297144,0.899572,0.900627
1400,0.1984,0.296427,0.898871,0.900163
1600,0.1963,0.274463,0.908058,0.908774
1800,0.1199,0.324276,0.906578,0.907588
2000,0.1173,0.330055,0.905099,0.904961


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5697,0.420992,0.849046,0.851027
400,0.3837,0.342205,0.872246,0.871845
600,0.3413,0.320257,0.882912,0.883167
800,0.3177,0.309318,0.886649,0.889232
1000,0.2034,0.333919,0.889918,0.890628
1200,0.1939,0.3065,0.897158,0.898169
1400,0.1756,0.33203,0.895757,0.895779
1600,0.1833,0.315067,0.899105,0.900081
1800,0.0997,0.41303,0.895368,0.896041
2000,0.1096,0.383955,0.898404,0.899189


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5697,0.420992,0.849046,0.851027
400,0.3837,0.342205,0.872246,0.871845
600,0.3413,0.320257,0.882912,0.883167
800,0.3177,0.309318,0.886649,0.889232
1000,0.2034,0.333919,0.889918,0.890628
1200,0.1939,0.3065,0.897158,0.898169
1400,0.1756,0.33203,0.895757,0.895779
1600,0.1833,0.315067,0.899105,0.900081
1800,0.0997,0.41303,0.895368,0.896041
2000,0.1096,0.383955,0.898404,0.899189


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5697,0.420992,0.849046,0.851027
400,0.3837,0.342205,0.872246,0.871845
600,0.3413,0.320257,0.882912,0.883167
800,0.3177,0.309318,0.886649,0.889232
1000,0.2034,0.333919,0.889918,0.890628
1200,0.1939,0.3065,0.897158,0.898169
1400,0.1756,0.33203,0.895757,0.895779
1600,0.1833,0.315067,0.899105,0.900081
1800,0.0997,0.41303,0.895368,0.896041
2000,0.1096,0.383955,0.898404,0.899189


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5863,0.418959,0.846789,0.851274
400,0.388,0.337141,0.878708,0.880512
600,0.346,0.337185,0.87427,0.876638
800,0.3166,0.287556,0.895835,0.898261
1000,0.1892,0.331814,0.891865,0.894101
1200,0.1935,0.315138,0.89926,0.900498
1400,0.1839,0.367583,0.89529,0.897815
1600,0.1924,0.298134,0.898093,0.898374
1800,0.0901,0.415397,0.900117,0.901781
2000,0.1024,0.345449,0.903231,0.904889


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5863,0.418959,0.846789,0.851274
400,0.388,0.337141,0.878708,0.880512
600,0.346,0.337185,0.87427,0.876638
800,0.3166,0.287556,0.895835,0.898261
1000,0.1892,0.331814,0.891865,0.894101
1200,0.1935,0.315138,0.89926,0.900498
1400,0.1839,0.367583,0.89529,0.897815
1600,0.1924,0.298134,0.898093,0.898374
1800,0.0901,0.415397,0.900117,0.901781
2000,0.1024,0.345449,0.903231,0.904889


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5863,0.418959,0.846789,0.851274
400,0.388,0.337141,0.878708,0.880512
600,0.346,0.337185,0.87427,0.876638
800,0.3166,0.287556,0.895835,0.898261
1000,0.1892,0.331814,0.891865,0.894101
1200,0.1935,0.315138,0.89926,0.900498
1400,0.1839,0.367583,0.89529,0.897815
1600,0.1924,0.298134,0.898093,0.898374
1800,0.0901,0.415397,0.900117,0.901781
2000,0.1024,0.345449,0.903231,0.904889


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5794,0.406504,0.849981,0.852607
400,0.4006,0.329811,0.8826,0.883543
600,0.3353,0.312707,0.888984,0.890136
800,0.3184,0.311362,0.891475,0.892757
1000,0.195,0.326677,0.896769,0.897405
1200,0.1902,0.316513,0.897703,0.899082
1400,0.192,0.306719,0.898715,0.899855
1600,0.1826,0.302315,0.906033,0.906298
1800,0.1035,0.370305,0.899805,0.900931
2000,0.0966,0.362582,0.902297,0.902983


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5794,0.406504,0.849981,0.852607
400,0.4006,0.329811,0.8826,0.883543
600,0.3353,0.312707,0.888984,0.890136
800,0.3184,0.311362,0.891475,0.892757
1000,0.195,0.326677,0.896769,0.897405
1200,0.1902,0.316513,0.897703,0.899082
1400,0.192,0.306719,0.898715,0.899855
1600,0.1826,0.302315,0.906033,0.906298
1800,0.1035,0.370305,0.899805,0.900931
2000,0.0966,0.362582,0.902297,0.902983


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5794,0.406504,0.849981,0.852607
400,0.4006,0.329811,0.8826,0.883543
600,0.3353,0.312707,0.888984,0.890136
800,0.3184,0.311362,0.891475,0.892757
1000,0.195,0.326677,0.896769,0.897405
1200,0.1902,0.316513,0.897703,0.899082
1400,0.192,0.306719,0.898715,0.899855
1600,0.1826,0.302315,0.906033,0.906298
1800,0.1035,0.370305,0.899805,0.900931
2000,0.0966,0.362582,0.902297,0.902983


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5183,0.400055,0.855819,0.85856
400,0.352,0.323563,0.880965,0.880229
600,0.322,0.321413,0.878474,0.879839
800,0.3002,0.320812,0.889062,0.891507
1000,0.1852,0.312078,0.899572,0.899827
1200,0.1804,0.321847,0.895056,0.895969
1400,0.1647,0.3322,0.892877,0.893622
1600,0.1673,0.27293,0.90471,0.90479
1800,0.0907,0.416385,0.902219,0.903558
2000,0.1022,0.417101,0.902686,0.902684


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5183,0.400055,0.855819,0.85856
400,0.352,0.323563,0.880965,0.880229
600,0.322,0.321413,0.878474,0.879839
800,0.3002,0.320812,0.889062,0.891507
1000,0.1852,0.312078,0.899572,0.899827
1200,0.1804,0.321847,0.895056,0.895969
1400,0.1647,0.3322,0.892877,0.893622
1600,0.1673,0.27293,0.90471,0.90479
1800,0.0907,0.416385,0.902219,0.903558
2000,0.1022,0.417101,0.902686,0.902684


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5183,0.400055,0.855819,0.85856
400,0.352,0.323563,0.880965,0.880229
600,0.322,0.321413,0.878474,0.879839
800,0.3002,0.320812,0.889062,0.891507
1000,0.1852,0.312078,0.899572,0.899827
1200,0.1804,0.321847,0.895056,0.895969
1400,0.1647,0.3322,0.892877,0.893622
1600,0.1673,0.27293,0.90471,0.90479
1800,0.0907,0.416385,0.902219,0.903558
2000,0.1022,0.417101,0.902686,0.902684


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5318,0.377057,0.862826,0.864612
400,0.3639,0.346614,0.873881,0.878404
600,0.3245,0.31277,0.885247,0.887986
800,0.2986,0.28842,0.899961,0.902094
1000,0.1835,0.313491,0.89856,0.900427
1200,0.1785,0.314792,0.896769,0.897812
1400,0.181,0.324076,0.906501,0.907483
1600,0.1773,0.301949,0.908525,0.909531
1800,0.0916,0.391261,0.898871,0.899786
2000,0.1002,0.347001,0.90253,0.904451


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5318,0.377057,0.862826,0.864612
400,0.3639,0.346614,0.873881,0.878404
600,0.3245,0.31277,0.885247,0.887986
800,0.2986,0.28842,0.899961,0.902094
1000,0.1835,0.313491,0.89856,0.900427
1200,0.1785,0.314792,0.896769,0.897812
1400,0.181,0.324076,0.906501,0.907483
1600,0.1773,0.301949,0.908525,0.909531
1800,0.0916,0.391261,0.898871,0.899786
2000,0.1002,0.347001,0.90253,0.904451


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5318,0.377057,0.862826,0.864612
400,0.3639,0.346614,0.873881,0.878404
600,0.3245,0.31277,0.885247,0.887986
800,0.2986,0.28842,0.899961,0.902094
1000,0.1835,0.313491,0.89856,0.900427
1200,0.1785,0.314792,0.896769,0.897812
1400,0.181,0.324076,0.906501,0.907483
1600,0.1773,0.301949,0.908525,0.909531
1800,0.0916,0.391261,0.898871,0.899786
2000,0.1002,0.347001,0.90253,0.904451


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5167,0.383668,0.865162,0.866277
400,0.3685,0.302611,0.892254,0.893209
600,0.3119,0.287366,0.896925,0.897515
800,0.2989,0.278034,0.901674,0.90228
1000,0.1815,0.302064,0.900895,0.902048
1200,0.1735,0.29859,0.904087,0.90503
1400,0.1767,0.313251,0.903542,0.904331
1600,0.1757,0.303742,0.906423,0.9064
1800,0.102,0.406801,0.902608,0.903977
2000,0.0957,0.397529,0.903464,0.904127


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5167,0.383668,0.865162,0.866277
400,0.3685,0.302611,0.892254,0.893209
600,0.3119,0.287366,0.896925,0.897515
800,0.2989,0.278034,0.901674,0.90228
1000,0.1815,0.302064,0.900895,0.902048
1200,0.1735,0.29859,0.904087,0.90503
1400,0.1767,0.313251,0.903542,0.904331
1600,0.1757,0.303742,0.906423,0.9064
1800,0.102,0.406801,0.902608,0.903977
2000,0.0957,0.397529,0.903464,0.904127


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5167,0.383668,0.865162,0.866277
400,0.3685,0.302611,0.892254,0.893209
600,0.3119,0.287366,0.896925,0.897515
800,0.2989,0.278034,0.901674,0.90228
1000,0.1815,0.302064,0.900895,0.902048
1200,0.1735,0.29859,0.904087,0.90503
1400,0.1767,0.313251,0.903542,0.904331
1600,0.1757,0.303742,0.906423,0.9064
1800,0.102,0.406801,0.902608,0.903977
2000,0.0957,0.397529,0.903464,0.904127


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5477,0.467789,0.836201,0.837411
400,0.3776,0.353324,0.867419,0.868211
600,0.3421,0.330717,0.884936,0.885955
800,0.3166,0.34108,0.885325,0.887455
1000,0.2001,0.316769,0.898015,0.898974
1200,0.1856,0.309893,0.90362,0.904108
1400,0.1761,0.345774,0.892409,0.893904
1600,0.1854,0.300741,0.901051,0.902351
1800,0.0995,0.462509,0.890619,0.893796
2000,0.1109,0.395658,0.89926,0.900435


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5477,0.467789,0.836201,0.837411
400,0.3776,0.353324,0.867419,0.868211
600,0.3421,0.330717,0.884936,0.885955
800,0.3166,0.34108,0.885325,0.887455
1000,0.2001,0.316769,0.898015,0.898974
1200,0.1856,0.309893,0.90362,0.904108
1400,0.1761,0.345774,0.892409,0.893904
1600,0.1854,0.300741,0.901051,0.902351
1800,0.0995,0.462509,0.890619,0.893796
2000,0.1109,0.395658,0.89926,0.900435


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5477,0.467789,0.836201,0.837411
400,0.3776,0.353324,0.867419,0.868211
600,0.3421,0.330717,0.884936,0.885955
800,0.3166,0.34108,0.885325,0.887455
1000,0.2001,0.316769,0.898015,0.898974
1200,0.1856,0.309893,0.90362,0.904108
1400,0.1761,0.345774,0.892409,0.893904
1600,0.1854,0.300741,0.901051,0.902351
1800,0.0995,0.462509,0.890619,0.893796
2000,0.1109,0.395658,0.89926,0.900435


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.568,0.429434,0.851927,0.852857
400,0.3731,0.363933,0.867886,0.868923
600,0.3399,0.316908,0.889918,0.88821
800,0.3121,0.297828,0.89817,0.89885
1000,0.1888,0.401092,0.881432,0.88447
1200,0.1824,0.302028,0.901051,0.901602
1400,0.1893,0.317201,0.903464,0.905169
1600,0.1896,0.293362,0.903387,0.903493
1800,0.1012,0.443456,0.899338,0.899546
2000,0.1049,0.36352,0.902997,0.902818


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.568,0.429434,0.851927,0.852857
400,0.3731,0.363933,0.867886,0.868923
600,0.3399,0.316908,0.889918,0.88821
800,0.3121,0.297828,0.89817,0.89885
1000,0.1888,0.401092,0.881432,0.88447
1200,0.1824,0.302028,0.901051,0.901602
1400,0.1893,0.317201,0.903464,0.905169
1600,0.1896,0.293362,0.903387,0.903493
1800,0.1012,0.443456,0.899338,0.899546
2000,0.1049,0.36352,0.902997,0.902818


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.568,0.429434,0.851927,0.852857
400,0.3731,0.363933,0.867886,0.868923
600,0.3399,0.316908,0.889918,0.88821
800,0.3121,0.297828,0.89817,0.89885
1000,0.1888,0.401092,0.881432,0.88447
1200,0.1824,0.302028,0.901051,0.901602
1400,0.1893,0.317201,0.903464,0.905169
1600,0.1896,0.293362,0.903387,0.903493
1800,0.1012,0.443456,0.899338,0.899546
2000,0.1049,0.36352,0.902997,0.902818


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5506,0.392213,0.863215,0.863006
400,0.3811,0.325223,0.884157,0.883868
600,0.3245,0.317456,0.891086,0.891236
800,0.3059,0.314065,0.89202,0.891602
1000,0.1953,0.337792,0.899027,0.900385
1200,0.1784,0.348104,0.896458,0.896068
1400,0.1845,0.301399,0.901674,0.902111
1600,0.1836,0.319159,0.902141,0.900406
1800,0.1055,0.435346,0.894278,0.894228
2000,0.1091,0.348592,0.905177,0.905092


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5506,0.392213,0.863215,0.863006
400,0.3811,0.325223,0.884157,0.883868
600,0.3245,0.317456,0.891086,0.891236
800,0.3059,0.314065,0.89202,0.891602
1000,0.1953,0.337792,0.899027,0.900385
1200,0.1784,0.348104,0.896458,0.896068
1400,0.1845,0.301399,0.901674,0.902111
1600,0.1836,0.319159,0.902141,0.900406
1800,0.1055,0.435346,0.894278,0.894228
2000,0.1091,0.348592,0.905177,0.905092


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5506,0.392213,0.863215,0.863006
400,0.3811,0.325223,0.884157,0.883868
600,0.3245,0.317456,0.891086,0.891236
800,0.3059,0.314065,0.89202,0.891602
1000,0.1953,0.337792,0.899027,0.900385
1200,0.1784,0.348104,0.896458,0.896068
1400,0.1845,0.301399,0.901674,0.902111
1600,0.1836,0.319159,0.902141,0.900406
1800,0.1055,0.435346,0.894278,0.894228
2000,0.1091,0.348592,0.905177,0.905092


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5623,0.398733,0.858311,0.860448
400,0.3641,0.32917,0.878474,0.880981
600,0.3277,0.302806,0.889607,0.891233
800,0.2999,0.307573,0.895134,0.897054
1000,0.1959,0.313354,0.897081,0.898744
1200,0.1874,0.296946,0.903464,0.903369
1400,0.1653,0.298588,0.899105,0.898997
1600,0.1681,0.264517,0.910004,0.910339
1800,0.0942,0.347955,0.905411,0.906394
2000,0.1023,0.316166,0.906189,0.906145


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5623,0.398733,0.858311,0.860448
400,0.3641,0.32917,0.878474,0.880981
600,0.3277,0.302806,0.889607,0.891233
800,0.2999,0.307573,0.895134,0.897054
1000,0.1959,0.313354,0.897081,0.898744
1200,0.1874,0.296946,0.903464,0.903369
1400,0.1653,0.298588,0.899105,0.898997
1600,0.1681,0.264517,0.910004,0.910339
1800,0.0942,0.347955,0.905411,0.906394
2000,0.1023,0.316166,0.906189,0.906145


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5623,0.398733,0.858311,0.860448
400,0.3641,0.32917,0.878474,0.880981
600,0.3277,0.302806,0.889607,0.891233
800,0.2999,0.307573,0.895134,0.897054
1000,0.1959,0.313354,0.897081,0.898744
1200,0.1874,0.296946,0.903464,0.903369
1400,0.1653,0.298588,0.899105,0.898997
1600,0.1681,0.264517,0.910004,0.910339
1800,0.0942,0.347955,0.905411,0.906394
2000,0.1023,0.316166,0.906189,0.906145


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5652,0.379404,0.866563,0.869108
400,0.3658,0.331956,0.878786,0.88213
600,0.328,0.321148,0.883067,0.885332
800,0.2962,0.280664,0.903309,0.904693
1000,0.1894,0.315495,0.900506,0.901884
1200,0.1784,0.291371,0.903931,0.905228
1400,0.1763,0.283496,0.911327,0.912207
1600,0.1789,0.284686,0.909926,0.910999
1800,0.0965,0.336459,0.9058,0.906894
2000,0.1003,0.338398,0.910315,0.910888


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5652,0.379404,0.866563,0.869108
400,0.3658,0.331956,0.878786,0.88213
600,0.328,0.321148,0.883067,0.885332
800,0.2962,0.280664,0.903309,0.904693
1000,0.1894,0.315495,0.900506,0.901884
1200,0.1784,0.291371,0.903931,0.905228
1400,0.1763,0.283496,0.911327,0.912207
1600,0.1789,0.284686,0.909926,0.910999
1800,0.0965,0.336459,0.9058,0.906894
2000,0.1003,0.338398,0.910315,0.910888


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5652,0.379404,0.866563,0.869108
400,0.3658,0.331956,0.878786,0.88213
600,0.328,0.321148,0.883067,0.885332
800,0.2962,0.280664,0.903309,0.904693
1000,0.1894,0.315495,0.900506,0.901884
1200,0.1784,0.291371,0.903931,0.905228
1400,0.1763,0.283496,0.911327,0.912207
1600,0.1789,0.284686,0.909926,0.910999
1800,0.0965,0.336459,0.9058,0.906894
2000,0.1003,0.338398,0.910315,0.910888


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.6098,0.396944,0.85652,0.859077
400,0.3799,0.309884,0.887583,0.888084
600,0.3168,0.291406,0.89856,0.899622
800,0.2925,0.277076,0.904165,0.905704
1000,0.1871,0.298924,0.903542,0.904958
1200,0.1722,0.304146,0.902063,0.9034
1400,0.1788,0.305622,0.905333,0.906893
1600,0.1738,0.269006,0.909381,0.909706
1800,0.1028,0.340549,0.907591,0.908356
2000,0.0978,0.341122,0.907435,0.907761


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.6098,0.396944,0.85652,0.859077
400,0.3799,0.309884,0.887583,0.888084
600,0.3168,0.291406,0.89856,0.899622
800,0.2925,0.277076,0.904165,0.905704
1000,0.1871,0.298924,0.903542,0.904958
1200,0.1722,0.304146,0.902063,0.9034
1400,0.1788,0.305622,0.905333,0.906893
1600,0.1738,0.269006,0.909381,0.909706
1800,0.1028,0.340549,0.907591,0.908356
2000,0.0978,0.341122,0.907435,0.907761


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.6098,0.396944,0.85652,0.859077
400,0.3799,0.309884,0.887583,0.888084
600,0.3168,0.291406,0.89856,0.899622
800,0.2925,0.277076,0.904165,0.905704
1000,0.1871,0.298924,0.903542,0.904958
1200,0.1722,0.304146,0.902063,0.9034
1400,0.1788,0.305622,0.905333,0.906893
1600,0.1738,0.269006,0.909381,0.909706
1800,0.1028,0.340549,0.907591,0.908356
2000,0.0978,0.341122,0.907435,0.907761


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4461,0.30391,0.893577,0.895881
400,0.2943,0.259559,0.906345,0.907004
600,0.2572,0.258683,0.908758,0.910629
800,0.2351,0.231949,0.919035,0.92136
1000,0.1603,0.24551,0.920981,0.922271
1200,0.1522,0.242382,0.920202,0.921152
1400,0.1467,0.252676,0.925496,0.926467
1600,0.1463,0.230767,0.923706,0.925349
1800,0.0808,0.338964,0.919891,0.921006
2000,0.0877,0.271695,0.926664,0.927262


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4461,0.30391,0.893577,0.895881
400,0.2943,0.259559,0.906345,0.907004
600,0.2572,0.258683,0.908758,0.910629
800,0.2351,0.231949,0.919035,0.92136
1000,0.1603,0.24551,0.920981,0.922271
1200,0.1522,0.242382,0.920202,0.921152
1400,0.1467,0.252676,0.925496,0.926467
1600,0.1463,0.230767,0.923706,0.925349
1800,0.0808,0.338964,0.919891,0.921006
2000,0.0877,0.271695,0.926664,0.927262


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4461,0.30391,0.893577,0.895881
400,0.2943,0.259559,0.906345,0.907004
600,0.2572,0.258683,0.908758,0.910629
800,0.2351,0.231949,0.919035,0.92136
1000,0.1603,0.24551,0.920981,0.922271
1200,0.1522,0.242382,0.920202,0.921152
1400,0.1467,0.252676,0.925496,0.926467
1600,0.1463,0.230767,0.923706,0.925349
1800,0.0808,0.338964,0.919891,0.921006
2000,0.0877,0.271695,0.926664,0.927262


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4088,0.294806,0.896224,0.897341
400,0.2787,0.26064,0.906501,0.909149
600,0.2526,0.229713,0.918723,0.919592
800,0.2372,0.228036,0.921915,0.924899
1000,0.1456,0.243935,0.921137,0.923077
1200,0.136,0.25197,0.922538,0.924247
1400,0.1486,0.218421,0.927209,0.929135
1600,0.1413,0.230679,0.924873,0.926327
1800,0.0718,0.297609,0.926197,0.927254
2000,0.077,0.284617,0.927053,0.928174


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4088,0.294806,0.896224,0.897341
400,0.2787,0.26064,0.906501,0.909149
600,0.2526,0.229713,0.918723,0.919592
800,0.2372,0.228036,0.921915,0.924899
1000,0.1456,0.243935,0.921137,0.923077
1200,0.136,0.25197,0.922538,0.924247
1400,0.1486,0.218421,0.927209,0.929135
1600,0.1413,0.230679,0.924873,0.926327
1800,0.0718,0.297609,0.926197,0.927254
2000,0.077,0.284617,0.927053,0.928174


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4088,0.294806,0.896224,0.897341
400,0.2787,0.26064,0.906501,0.909149
600,0.2526,0.229713,0.918723,0.919592
800,0.2372,0.228036,0.921915,0.924899
1000,0.1456,0.243935,0.921137,0.923077
1200,0.136,0.25197,0.922538,0.924247
1400,0.1486,0.218421,0.927209,0.929135
1600,0.1413,0.230679,0.924873,0.926327
1800,0.0718,0.297609,0.926197,0.927254
2000,0.077,0.284617,0.927053,0.928174


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4766,0.299961,0.893188,0.896118
400,0.293,0.258317,0.91016,0.912477
600,0.2571,0.240444,0.913663,0.914359
800,0.2379,0.223113,0.920202,0.920933
1000,0.1565,0.249944,0.91919,0.919463
1200,0.1486,0.26737,0.921214,0.921878
1400,0.1499,0.274503,0.919112,0.920227
1600,0.1488,0.231554,0.926041,0.926505
1800,0.0843,0.282479,0.923861,0.924619
2000,0.0781,0.320542,0.923472,0.924888


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4766,0.299961,0.893188,0.896118
400,0.293,0.258317,0.91016,0.912477
600,0.2571,0.240444,0.913663,0.914359
800,0.2379,0.223113,0.920202,0.920933
1000,0.1565,0.249944,0.91919,0.919463
1200,0.1486,0.26737,0.921214,0.921878
1400,0.1499,0.274503,0.919112,0.920227
1600,0.1488,0.231554,0.926041,0.926505
1800,0.0843,0.282479,0.923861,0.924619
2000,0.0781,0.320542,0.923472,0.924888


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.4766,0.299961,0.893188,0.896118
400,0.293,0.258317,0.91016,0.912477
600,0.2571,0.240444,0.913663,0.914359
800,0.2379,0.223113,0.920202,0.920933
1000,0.1565,0.249944,0.91919,0.919463
1200,0.1486,0.26737,0.921214,0.921878
1400,0.1499,0.274503,0.919112,0.920227
1600,0.1488,0.231554,0.926041,0.926505
1800,0.0843,0.282479,0.923861,0.924619
2000,0.0781,0.320542,0.923472,0.924888


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 51377
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 12845
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5229,0.408635,0.844687,0.851695
400,0.3844,0.33805,0.873025,0.873689
600,0.341,0.36135,0.866329,0.87171
800,0.3161,0.3174,0.885948,0.889596
1000,0.2009,0.296507,0.899805,0.901718
1200,0.1943,0.324946,0.891475,0.892893
1400,0.1852,0.314213,0.898248,0.899359
1600,0.1767,0.292816,0.898793,0.900424
1800,0.0932,0.412669,0.897314,0.899403
2000,0.1024,0.337599,0.900428,0.901381


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5229,0.408635,0.844687,0.851695
400,0.3844,0.33805,0.873025,0.873689
600,0.341,0.36135,0.866329,0.87171
800,0.3161,0.3174,0.885948,0.889596
1000,0.2009,0.296507,0.899805,0.901718
1200,0.1943,0.324946,0.891475,0.892893
1400,0.1852,0.314213,0.898248,0.899359
1600,0.1767,0.292816,0.898793,0.900424
1800,0.0932,0.412669,0.897314,0.899403
2000,0.1024,0.337599,0.900428,0.901381


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5229,0.408635,0.844687,0.851695
400,0.3844,0.33805,0.873025,0.873689
600,0.341,0.36135,0.866329,0.87171
800,0.3161,0.3174,0.885948,0.889596
1000,0.2009,0.296507,0.899805,0.901718
1200,0.1943,0.324946,0.891475,0.892893
1400,0.1852,0.314213,0.898248,0.899359
1600,0.1767,0.292816,0.898793,0.900424
1800,0.0932,0.412669,0.897314,0.899403
2000,0.1024,0.337599,0.900428,0.901381


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.539,0.410684,0.850993,0.857287
400,0.3758,0.324545,0.880654,0.884067
600,0.3429,0.30275,0.888206,0.890315
800,0.3133,0.294278,0.896302,0.900187
1000,0.197,0.301851,0.889918,0.892497
1200,0.1868,0.298763,0.901129,0.903314
1400,0.1948,0.304276,0.899805,0.902328
1600,0.1889,0.291546,0.904944,0.907489
1800,0.0975,0.385142,0.89856,0.902611
2000,0.1021,0.36499,0.905333,0.907524


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.539,0.410684,0.850993,0.857287
400,0.3758,0.324545,0.880654,0.884067
600,0.3429,0.30275,0.888206,0.890315
800,0.3133,0.294278,0.896302,0.900187
1000,0.197,0.301851,0.889918,0.892497
1200,0.1868,0.298763,0.901129,0.903314
1400,0.1948,0.304276,0.899805,0.902328
1600,0.1889,0.291546,0.904944,0.907489
1800,0.0975,0.385142,0.89856,0.902611
2000,0.1021,0.36499,0.905333,0.907524


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.539,0.410684,0.850993,0.857287
400,0.3758,0.324545,0.880654,0.884067
600,0.3429,0.30275,0.888206,0.890315
800,0.3133,0.294278,0.896302,0.900187
1000,0.197,0.301851,0.889918,0.892497
1200,0.1868,0.298763,0.901129,0.903314
1400,0.1948,0.304276,0.899805,0.902328
1600,0.1889,0.291546,0.904944,0.907489
1800,0.0975,0.385142,0.89856,0.902611
2000,0.1021,0.36499,0.905333,0.907524


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5337,0.401213,0.852238,0.857688
400,0.3936,0.333646,0.872246,0.876476
600,0.3309,0.308024,0.884313,0.887139
800,0.3085,0.305779,0.891475,0.893667
1000,0.1984,0.314569,0.893655,0.896056
1200,0.1873,0.304661,0.897003,0.899069
1400,0.1886,0.312993,0.896302,0.898352
1600,0.19,0.296088,0.902842,0.904663
1800,0.0987,0.36607,0.90035,0.902915
2000,0.1005,0.366652,0.89856,0.899951


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5337,0.401213,0.852238,0.857688
400,0.3936,0.333646,0.872246,0.876476
600,0.3309,0.308024,0.884313,0.887139
800,0.3085,0.305779,0.891475,0.893667
1000,0.1984,0.314569,0.893655,0.896056
1200,0.1873,0.304661,0.897003,0.899069
1400,0.1886,0.312993,0.896302,0.898352
1600,0.19,0.296088,0.902842,0.904663
1800,0.0987,0.36607,0.90035,0.902915
2000,0.1005,0.366652,0.89856,0.899951


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/51377 [00:00<?, ? examples/s]

Map:   0%|          | 0/12845 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
200,0.5337,0.401213,0.852238,0.857688
400,0.3936,0.333646,0.872246,0.876476
600,0.3309,0.308024,0.884313,0.887139
800,0.3085,0.305779,0.891475,0.893667
1000,0.1984,0.314569,0.893655,0.896056
1200,0.1873,0.304661,0.897003,0.899069
1400,0.1886,0.312993,0.896302,0.898352
1600,0.19,0.296088,0.902842,0.904663
1800,0.0987,0.36607,0.90035,0.902915
2000,0.1005,0.366652,0.89856,0.899951


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.910471,0.910979
3,SI2M-Lab/DarijaBERT-arabizi,0.911094,0.9131
6,SI2M-Lab/DarijaBERT-mix,0.928922,0.929488
9,UBC-NLP/MARBERT,0.906812,0.908132
12,UBC-NLP/MARBERTv2,0.914675,0.916232
15,aubmindlab/bert-base-arabertv02-twitter,0.913663,0.91508
18,qarib/bert-base-qarib,0.914675,0.915973
