In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'MSA_MDA_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/MSA_MDA_comments.csv', encoding='utf-8', engine='python', sep='\t') #, quotechar="'"  , quoting=3

display(len(df))
df = df[df['language'] == 'mda']
      
display(df.columns)
display(df[:4])


display(len(df))

c = df['sentiment'].value_counts()
display(c)

classes = set(df['sentiment'].values)
display(classes)

df['sentiment'] = df['sentiment'].astype('category')
df['label'] = df['sentiment'].cat.codes

df = df[['text', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]


seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 15
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 25, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 25
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-18 17:19:36.631510: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-18 17:19:36.654432: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


9901

Index(['text', 'language', 'sentiment'], dtype='object')

Unnamed: 0,text,language,sentiment
6359,اجي هاك الطاجين راك فزت به سربي ما حدو سخون. بالصحة والعافية.,mda,positive
6360,اخصنى انديروها ابنات ميدالت فالصيف فالمو صمورة متافقين ويشجعون ولداتنا تخيلوها هههههههه,mda,positive
6361,الفلاح هوا العمود الفقري ديال المغرب تبرك الله عليك الله يعونك,mda,positive
6362,كاين الخير والأرض خضارت والفلاح نشط مع هاد الأمطار غير كاين سمر والبرد مع الصباح حيت ليالي قريبة والحمد القوي العزيز,mda,positive


3542

sentiment
negative    2858
positive     684
Name: count, dtype: int64

{'negative', 'positive'}

2

3542

DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3375,0.207084,0.928068,0.886214
50,0.2264,0.214652,0.921016,0.865709
75,0.1361,0.22563,0.923836,0.877858
100,0.0987,0.242153,0.928068,0.889178
125,0.0729,0.246467,0.916784,0.871129
150,0.0357,0.348549,0.919605,0.873511
175,0.0426,0.439359,0.912553,0.84554
200,0.0298,0.437067,0.885755,0.838331
225,0.016,0.452397,0.901269,0.852744
250,0.0114,0.493814,0.897038,0.849665


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3,0.229931,0.916784,0.867647
50,0.2202,0.202714,0.906911,0.860483
75,0.1354,0.243888,0.90409,0.854832
100,0.0998,0.273259,0.912553,0.857372
125,0.077,0.258759,0.923836,0.879846
150,0.0491,0.327968,0.919605,0.874846
175,0.0437,0.4028,0.916784,0.862292
200,0.0252,0.33559,0.911142,0.861671
225,0.0148,0.399127,0.913963,0.869451
250,0.011,0.432407,0.919605,0.86373


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3,0.229931,0.916784,0.867647
50,0.2202,0.202714,0.906911,0.860483
75,0.1354,0.243888,0.90409,0.854832
100,0.0998,0.273259,0.912553,0.857372
125,0.077,0.258759,0.923836,0.879846
150,0.0491,0.327968,0.919605,0.874846
175,0.0437,0.4028,0.916784,0.862292
200,0.0252,0.33559,0.911142,0.861671
225,0.0148,0.399127,0.913963,0.869451
250,0.011,0.432407,0.919605,0.86373


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3137,0.191774,0.929478,0.886273
50,0.2338,0.199869,0.930889,0.879113
75,0.1509,0.20005,0.925247,0.880452
100,0.0944,0.256647,0.926657,0.886713
125,0.0743,0.275015,0.930889,0.881396
150,0.0583,0.324196,0.916784,0.873731
175,0.0416,0.313772,0.923836,0.882356
200,0.023,0.302198,0.926657,0.881056
225,0.0063,0.380978,0.932299,0.893196
250,0.0024,0.397399,0.930889,0.890676


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3137,0.191774,0.929478,0.886273
50,0.2338,0.199869,0.930889,0.879113
75,0.1509,0.20005,0.925247,0.880452
100,0.0944,0.256647,0.926657,0.886713
125,0.0743,0.275015,0.930889,0.881396
150,0.0583,0.324196,0.916784,0.873731
175,0.0416,0.313772,0.923836,0.882356
200,0.023,0.302198,0.926657,0.881056
225,0.0063,0.380978,0.932299,0.893196
250,0.0024,0.397399,0.930889,0.890676


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3137,0.191774,0.929478,0.886273
50,0.2338,0.199869,0.930889,0.879113
75,0.1509,0.20005,0.925247,0.880452
100,0.0944,0.256647,0.926657,0.886713
125,0.0743,0.275015,0.930889,0.881396
150,0.0583,0.324196,0.916784,0.873731
175,0.0416,0.313772,0.923836,0.882356
200,0.023,0.302198,0.926657,0.881056
225,0.0063,0.380978,0.932299,0.893196
250,0.0024,0.397399,0.930889,0.890676


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3269,0.26857,0.925247,0.857952
50,0.2243,0.242812,0.912553,0.829393
75,0.1548,0.25565,0.928068,0.865292
100,0.1237,0.200083,0.929478,0.882954
125,0.0748,0.253201,0.930889,0.877525
150,0.0429,0.257624,0.93653,0.893072
175,0.027,0.303472,0.932299,0.878821
200,0.0263,0.324396,0.928068,0.879543
225,0.0145,0.346469,0.928068,0.872526
250,0.0063,0.397287,0.929478,0.886273


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3269,0.26857,0.925247,0.857952
50,0.2243,0.242812,0.912553,0.829393
75,0.1548,0.25565,0.928068,0.865292
100,0.1237,0.200083,0.929478,0.882954
125,0.0748,0.253201,0.930889,0.877525
150,0.0429,0.257624,0.93653,0.893072
175,0.027,0.303472,0.932299,0.878821
200,0.0263,0.324396,0.928068,0.879543
225,0.0145,0.346469,0.928068,0.872526
250,0.0063,0.397287,0.929478,0.886273


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3269,0.26857,0.925247,0.857952
50,0.2243,0.242812,0.912553,0.829393
75,0.1548,0.25565,0.928068,0.865292
100,0.1237,0.200083,0.929478,0.882954
125,0.0748,0.253201,0.930889,0.877525
150,0.0429,0.257624,0.93653,0.893072
175,0.027,0.303472,0.932299,0.878821
200,0.0263,0.324396,0.928068,0.879543
225,0.0145,0.346469,0.928068,0.872526
250,0.0063,0.397287,0.929478,0.886273


DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3263,0.313917,0.894217,0.817319
50,0.2705,0.295167,0.887165,0.831707
75,0.15,0.284772,0.901269,0.837095
100,0.0986,0.395318,0.899859,0.844106
125,0.0777,0.297601,0.901269,0.840783
150,0.0365,0.465078,0.90409,0.848694
175,0.04,0.647011,0.850494,0.794953
200,0.0329,0.47926,0.908322,0.848287
225,0.0255,0.609188,0.898449,0.825178
250,0.0161,0.589552,0.898449,0.833412


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3263,0.313917,0.894217,0.817319
50,0.2705,0.295167,0.887165,0.831707
75,0.15,0.284772,0.901269,0.837095
100,0.0986,0.395318,0.899859,0.844106
125,0.0777,0.297601,0.901269,0.840783
150,0.0365,0.465078,0.90409,0.848694
175,0.04,0.647011,0.850494,0.794953
200,0.0329,0.47926,0.908322,0.848287
225,0.0255,0.609188,0.898449,0.825178
250,0.0161,0.589552,0.898449,0.833412


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3263,0.313917,0.894217,0.817319
50,0.2705,0.295167,0.887165,0.831707
75,0.15,0.284772,0.901269,0.837095
100,0.0986,0.395318,0.899859,0.844106
125,0.0777,0.297601,0.901269,0.840783
150,0.0365,0.465078,0.90409,0.848694
175,0.04,0.647011,0.850494,0.794953
200,0.0329,0.47926,0.908322,0.848287
225,0.0255,0.609188,0.898449,0.825178
250,0.0161,0.589552,0.898449,0.833412


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3659,0.276124,0.899859,0.838053
50,0.2589,0.277694,0.912553,0.840241
75,0.1671,0.278858,0.922426,0.867699
100,0.1154,0.394684,0.889986,0.834306
125,0.0733,0.40994,0.888575,0.829212
150,0.0535,0.42582,0.901269,0.841668
175,0.0425,0.416044,0.908322,0.854979
200,0.0302,0.440367,0.913963,0.858453
225,0.0081,0.527375,0.905501,0.846309
250,0.0077,0.611171,0.901269,0.850562


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3659,0.276124,0.899859,0.838053
50,0.2589,0.277694,0.912553,0.840241
75,0.1671,0.278858,0.922426,0.867699
100,0.1154,0.394684,0.889986,0.834306
125,0.0733,0.40994,0.888575,0.829212
150,0.0535,0.42582,0.901269,0.841668
175,0.0425,0.416044,0.908322,0.854979
200,0.0302,0.440367,0.913963,0.858453
225,0.0081,0.527375,0.905501,0.846309
250,0.0077,0.611171,0.901269,0.850562


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3659,0.276124,0.899859,0.838053
50,0.2589,0.277694,0.912553,0.840241
75,0.1671,0.278858,0.922426,0.867699
100,0.1154,0.394684,0.889986,0.834306
125,0.0733,0.40994,0.888575,0.829212
150,0.0535,0.42582,0.901269,0.841668
175,0.0425,0.416044,0.908322,0.854979
200,0.0302,0.440367,0.913963,0.858453
225,0.0081,0.527375,0.905501,0.846309
250,0.0077,0.611171,0.901269,0.850562


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.393,0.264584,0.913963,0.832786
50,0.2409,0.251296,0.891396,0.829128
75,0.1785,0.246763,0.921016,0.849355
100,0.1115,0.397505,0.863188,0.808047
125,0.0716,0.361336,0.915374,0.847501
150,0.0761,0.36871,0.923836,0.868052
175,0.0304,0.372725,0.906911,0.84458
200,0.0135,0.505332,0.918195,0.849502
225,0.0289,0.598238,0.909732,0.823889
250,0.012,0.569692,0.913963,0.844431


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.393,0.264584,0.913963,0.832786
50,0.2409,0.251296,0.891396,0.829128
75,0.1785,0.246763,0.921016,0.849355
100,0.1115,0.397505,0.863188,0.808047
125,0.0716,0.361336,0.915374,0.847501
150,0.0761,0.36871,0.923836,0.868052
175,0.0304,0.372725,0.906911,0.84458
200,0.0135,0.505332,0.918195,0.849502
225,0.0289,0.598238,0.909732,0.823889
250,0.012,0.569692,0.913963,0.844431


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.393,0.264584,0.913963,0.832786
50,0.2409,0.251296,0.891396,0.829128
75,0.1785,0.246763,0.921016,0.849355
100,0.1115,0.397505,0.863188,0.808047
125,0.0716,0.361336,0.915374,0.847501
150,0.0761,0.36871,0.923836,0.868052
175,0.0304,0.372725,0.906911,0.84458
200,0.0135,0.505332,0.918195,0.849502
225,0.0289,0.598238,0.909732,0.823889
250,0.012,0.569692,0.913963,0.844431


DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3316,0.249617,0.918195,0.868811
50,0.2316,0.22769,0.921016,0.874719
75,0.1268,0.251838,0.916784,0.873731
100,0.1052,0.243495,0.922426,0.87525
125,0.0563,0.36914,0.915374,0.856995
150,0.0382,0.407392,0.918195,0.867331
175,0.0239,0.443966,0.915374,0.865035
200,0.0065,0.511793,0.909732,0.864711
225,0.0163,0.470916,0.909732,0.851921
250,0.0156,0.462656,0.918195,0.880278


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3316,0.249617,0.918195,0.868811
50,0.2316,0.22769,0.921016,0.874719
75,0.1268,0.251838,0.916784,0.873731
100,0.1052,0.243495,0.922426,0.87525
125,0.0563,0.36914,0.915374,0.856995
150,0.0382,0.407392,0.918195,0.867331
175,0.0239,0.443966,0.915374,0.865035
200,0.0065,0.511793,0.909732,0.864711
225,0.0163,0.470916,0.909732,0.851921
250,0.0156,0.462656,0.918195,0.880278


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3316,0.249617,0.918195,0.868811
50,0.2316,0.22769,0.921016,0.874719
75,0.1268,0.251838,0.916784,0.873731
100,0.1052,0.243495,0.922426,0.87525
125,0.0563,0.36914,0.915374,0.856995
150,0.0382,0.407392,0.918195,0.867331
175,0.0239,0.443966,0.915374,0.865035
200,0.0065,0.511793,0.909732,0.864711
225,0.0163,0.470916,0.909732,0.851921
250,0.0156,0.462656,0.918195,0.880278


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3449,0.217253,0.933709,0.888319
50,0.2246,0.246524,0.918195,0.851575
75,0.1565,0.220571,0.928068,0.885593
100,0.1114,0.391557,0.90268,0.857902
125,0.0587,0.391273,0.915374,0.861973
150,0.0506,0.411834,0.915374,0.867911
175,0.0374,0.430394,0.911142,0.856301
200,0.0168,0.42742,0.919605,0.872134
225,0.0112,0.487488,0.918195,0.867331
250,0.018,0.520765,0.918195,0.868077


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3449,0.217253,0.933709,0.888319
50,0.2246,0.246524,0.918195,0.851575
75,0.1565,0.220571,0.928068,0.885593
100,0.1114,0.391557,0.90268,0.857902
125,0.0587,0.391273,0.915374,0.861973
150,0.0506,0.411834,0.915374,0.867911
175,0.0374,0.430394,0.911142,0.856301
200,0.0168,0.42742,0.919605,0.872134
225,0.0112,0.487488,0.918195,0.867331
250,0.018,0.520765,0.918195,0.868077


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3449,0.217253,0.933709,0.888319
50,0.2246,0.246524,0.918195,0.851575
75,0.1565,0.220571,0.928068,0.885593
100,0.1114,0.391557,0.90268,0.857902
125,0.0587,0.391273,0.915374,0.861973
150,0.0506,0.411834,0.915374,0.867911
175,0.0374,0.430394,0.911142,0.856301
200,0.0168,0.42742,0.919605,0.872134
225,0.0112,0.487488,0.918195,0.867331
250,0.018,0.520765,0.918195,0.868077


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3372,0.229155,0.895628,0.835344
50,0.2335,0.216281,0.921016,0.866529
75,0.1517,0.217269,0.929478,0.871162
100,0.1098,0.234475,0.913963,0.862407
125,0.0535,0.315478,0.921016,0.857667
150,0.045,0.317443,0.913963,0.858453
175,0.0212,0.324676,0.923836,0.872073
200,0.0439,0.393694,0.930889,0.868672
225,0.0282,0.409517,0.926657,0.860115
250,0.0051,0.418061,0.921016,0.871175


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3372,0.229155,0.895628,0.835344
50,0.2335,0.216281,0.921016,0.866529
75,0.1517,0.217269,0.929478,0.871162
100,0.1098,0.234475,0.913963,0.862407
125,0.0535,0.315478,0.921016,0.857667
150,0.045,0.317443,0.913963,0.858453
175,0.0212,0.324676,0.923836,0.872073
200,0.0439,0.393694,0.930889,0.868672
225,0.0282,0.409517,0.926657,0.860115
250,0.0051,0.418061,0.921016,0.871175


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3372,0.229155,0.895628,0.835344
50,0.2335,0.216281,0.921016,0.866529
75,0.1517,0.217269,0.929478,0.871162
100,0.1098,0.234475,0.913963,0.862407
125,0.0535,0.315478,0.921016,0.857667
150,0.045,0.317443,0.913963,0.858453
175,0.0212,0.324676,0.923836,0.872073
200,0.0439,0.393694,0.930889,0.868672
225,0.0282,0.409517,0.926657,0.860115
250,0.0051,0.418061,0.921016,0.871175


DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3823,0.451341,0.867419,0.737283
50,0.2972,0.265321,0.908322,0.854979
75,0.1819,0.316149,0.90409,0.83592
100,0.1747,0.261602,0.916784,0.869769
125,0.1365,0.33807,0.895628,0.822544
150,0.074,0.477394,0.906911,0.847294
175,0.0819,0.416294,0.892807,0.840122
200,0.042,0.589721,0.901269,0.822084
225,0.0283,0.563789,0.90409,0.837928
250,0.0115,0.68427,0.884344,0.80574


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3823,0.451341,0.867419,0.737283
50,0.2972,0.265321,0.908322,0.854979
75,0.1819,0.316149,0.90409,0.83592
100,0.1747,0.261602,0.916784,0.869769
125,0.1365,0.33807,0.895628,0.822544
150,0.074,0.477394,0.906911,0.847294
175,0.0819,0.416294,0.892807,0.840122
200,0.042,0.589721,0.901269,0.822084
225,0.0283,0.563789,0.90409,0.837928
250,0.0115,0.68427,0.884344,0.80574


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3823,0.451341,0.867419,0.737283
50,0.2972,0.265321,0.908322,0.854979
75,0.1819,0.316149,0.90409,0.83592
100,0.1747,0.261602,0.916784,0.869769
125,0.1365,0.33807,0.895628,0.822544
150,0.074,0.477394,0.906911,0.847294
175,0.0819,0.416294,0.892807,0.840122
200,0.042,0.589721,0.901269,0.822084
225,0.0283,0.563789,0.90409,0.837928
250,0.0115,0.68427,0.884344,0.80574


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4064,0.284844,0.897038,0.809913
50,0.2805,0.217623,0.923836,0.87433
75,0.2332,0.299272,0.899859,0.851711
100,0.1667,0.317126,0.926657,0.875301
125,0.1111,0.322117,0.912553,0.839123
150,0.1159,0.413574,0.912553,0.864223
175,0.0552,0.404611,0.913963,0.854167
200,0.0308,0.559265,0.905501,0.848873
225,0.0484,0.55118,0.913963,0.863903
250,0.0219,0.537521,0.912553,0.857372


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4064,0.284844,0.897038,0.809913
50,0.2805,0.217623,0.923836,0.87433
75,0.2332,0.299272,0.899859,0.851711
100,0.1667,0.317126,0.926657,0.875301
125,0.1111,0.322117,0.912553,0.839123
150,0.1159,0.413574,0.912553,0.864223
175,0.0552,0.404611,0.913963,0.854167
200,0.0308,0.559265,0.905501,0.848873
225,0.0484,0.55118,0.913963,0.863903
250,0.0219,0.537521,0.912553,0.857372


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4064,0.284844,0.897038,0.809913
50,0.2805,0.217623,0.923836,0.87433
75,0.2332,0.299272,0.899859,0.851711
100,0.1667,0.317126,0.926657,0.875301
125,0.1111,0.322117,0.912553,0.839123
150,0.1159,0.413574,0.912553,0.864223
175,0.0552,0.404611,0.913963,0.854167
200,0.0308,0.559265,0.905501,0.848873
225,0.0484,0.55118,0.913963,0.863903
250,0.0219,0.537521,0.912553,0.857372


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3974,0.295962,0.905501,0.816339
50,0.2489,0.427995,0.826516,0.769767
75,0.2087,0.247952,0.911142,0.856301
100,0.176,0.309167,0.909732,0.846524
125,0.2533,0.365548,0.912553,0.847533
150,0.1296,0.336214,0.860367,0.797057
175,0.119,0.28471,0.913963,0.855053
200,0.0494,0.39921,0.915374,0.859545
225,0.0382,0.426419,0.918195,0.854549
250,0.0292,0.774001,0.857546,0.80423


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3974,0.295962,0.905501,0.816339
50,0.2489,0.427995,0.826516,0.769767
75,0.2087,0.247952,0.911142,0.856301
100,0.176,0.309167,0.909732,0.846524
125,0.2533,0.365548,0.912553,0.847533
150,0.1296,0.336214,0.860367,0.797057
175,0.119,0.28471,0.913963,0.855053
200,0.0494,0.39921,0.915374,0.859545
225,0.0382,0.426419,0.918195,0.854549
250,0.0292,0.774001,0.857546,0.80423


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3974,0.295962,0.905501,0.816339
50,0.2489,0.427995,0.826516,0.769767
75,0.2087,0.247952,0.911142,0.856301
100,0.176,0.309167,0.909732,0.846524
125,0.2533,0.365548,0.912553,0.847533
150,0.1296,0.336214,0.860367,0.797057
175,0.119,0.28471,0.913963,0.855053
200,0.0494,0.39921,0.915374,0.859545
225,0.0382,0.426419,0.918195,0.854549
250,0.0292,0.774001,0.857546,0.80423


DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4076,0.411957,0.878702,0.770353
50,0.2845,0.221763,0.912553,0.862045
75,0.185,0.232264,0.916784,0.870454
100,0.1358,0.321836,0.908322,0.86736
125,0.1267,0.334332,0.918195,0.867331
150,0.0594,0.363196,0.906911,0.858396
175,0.087,0.386122,0.921016,0.870431
200,0.0406,0.425387,0.90409,0.836932
225,0.0284,0.386693,0.912553,0.866978
250,0.0219,0.480977,0.912553,0.864223


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4076,0.411957,0.878702,0.770353
50,0.2845,0.221763,0.912553,0.862045
75,0.185,0.232264,0.916784,0.870454
100,0.1358,0.321836,0.908322,0.86736
125,0.1267,0.334332,0.918195,0.867331
150,0.0594,0.363196,0.906911,0.858396
175,0.087,0.386122,0.921016,0.870431
200,0.0406,0.425387,0.90409,0.836932
225,0.0284,0.386693,0.912553,0.866978
250,0.0219,0.480977,0.912553,0.864223


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4076,0.411957,0.878702,0.770353
50,0.2845,0.221763,0.912553,0.862045
75,0.185,0.232264,0.916784,0.870454
100,0.1358,0.321836,0.908322,0.86736
125,0.1267,0.334332,0.918195,0.867331
150,0.0594,0.363196,0.906911,0.858396
175,0.087,0.386122,0.921016,0.870431
200,0.0406,0.425387,0.90409,0.836932
225,0.0284,0.386693,0.912553,0.866978
250,0.0219,0.480977,0.912553,0.864223


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4069,0.276319,0.905501,0.846309
50,0.231,0.225302,0.925247,0.875563
75,0.1939,0.258501,0.922426,0.864311
100,0.1644,0.261877,0.916784,0.869769
125,0.1106,0.227335,0.937941,0.898196
150,0.0778,0.317568,0.923836,0.881743
175,0.0575,0.349964,0.919605,0.861162
200,0.0417,0.421373,0.916784,0.871795
225,0.0374,0.361525,0.929478,0.886273
250,0.0215,0.352465,0.930889,0.886954


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4069,0.276319,0.905501,0.846309
50,0.231,0.225302,0.925247,0.875563
75,0.1939,0.258501,0.922426,0.864311
100,0.1644,0.261877,0.916784,0.869769
125,0.1106,0.227335,0.937941,0.898196
150,0.0778,0.317568,0.923836,0.881743
175,0.0575,0.349964,0.919605,0.861162
200,0.0417,0.421373,0.916784,0.871795
225,0.0374,0.361525,0.929478,0.886273
250,0.0215,0.352465,0.930889,0.886954


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.4069,0.276319,0.905501,0.846309
50,0.231,0.225302,0.925247,0.875563
75,0.1939,0.258501,0.922426,0.864311
100,0.1644,0.261877,0.916784,0.869769
125,0.1106,0.227335,0.937941,0.898196
150,0.0778,0.317568,0.923836,0.881743
175,0.0575,0.349964,0.919605,0.861162
200,0.0417,0.421373,0.916784,0.871795
225,0.0374,0.361525,0.929478,0.886273
250,0.0215,0.352465,0.930889,0.886954


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3801,0.233216,0.906911,0.852348
50,0.2404,0.237357,0.925247,0.861992
75,0.1864,0.279254,0.921016,0.847076
100,0.1131,0.264522,0.922426,0.87662
125,0.0882,0.266224,0.932299,0.873671
150,0.0655,0.277154,0.918195,0.861762
175,0.0505,0.306087,0.929478,0.877043
200,0.0211,0.38501,0.925247,0.874819
225,0.0174,0.505904,0.918195,0.842806
250,0.0224,0.446047,0.926657,0.868722


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3801,0.233216,0.906911,0.852348
50,0.2404,0.237357,0.925247,0.861992
75,0.1864,0.279254,0.921016,0.847076
100,0.1131,0.264522,0.922426,0.87662
125,0.0882,0.266224,0.932299,0.873671
150,0.0655,0.277154,0.918195,0.861762
175,0.0505,0.306087,0.929478,0.877043
200,0.0211,0.38501,0.925247,0.874819
225,0.0174,0.505904,0.918195,0.842806
250,0.0224,0.446047,0.926657,0.868722


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3801,0.233216,0.906911,0.852348
50,0.2404,0.237357,0.925247,0.861992
75,0.1864,0.279254,0.921016,0.847076
100,0.1131,0.264522,0.922426,0.87662
125,0.0882,0.266224,0.932299,0.873671
150,0.0655,0.277154,0.918195,0.861762
175,0.0505,0.306087,0.929478,0.877043
200,0.0211,0.38501,0.925247,0.874819
225,0.0174,0.505904,0.918195,0.842806
250,0.0224,0.446047,0.926657,0.868722


DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3501,0.256929,0.909732,0.840558
50,0.2186,0.241283,0.909732,0.843617
75,0.1616,0.229976,0.909732,0.869696
100,0.0936,0.248885,0.923836,0.869701
125,0.0597,0.36242,0.925247,0.877726
150,0.0262,0.365813,0.918195,0.876792
175,0.0264,0.385287,0.921016,0.883317
200,0.0235,0.424178,0.915374,0.879985
225,0.0125,0.364926,0.933709,0.88899
250,0.0178,0.338035,0.930889,0.887599


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3501,0.256929,0.909732,0.840558
50,0.2186,0.241283,0.909732,0.843617
75,0.1616,0.229976,0.909732,0.869696
100,0.0936,0.248885,0.923836,0.869701
125,0.0597,0.36242,0.925247,0.877726
150,0.0262,0.365813,0.918195,0.876792
175,0.0264,0.385287,0.921016,0.883317
200,0.0235,0.424178,0.915374,0.879985
225,0.0125,0.364926,0.933709,0.88899
250,0.0178,0.338035,0.930889,0.887599


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3501,0.256929,0.909732,0.840558
50,0.2186,0.241283,0.909732,0.843617
75,0.1616,0.229976,0.909732,0.869696
100,0.0936,0.248885,0.923836,0.869701
125,0.0597,0.36242,0.925247,0.877726
150,0.0262,0.365813,0.918195,0.876792
175,0.0264,0.385287,0.921016,0.883317
200,0.0235,0.424178,0.915374,0.879985
225,0.0125,0.364926,0.933709,0.88899
250,0.0178,0.338035,0.930889,0.887599


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3942,0.237306,0.912553,0.839123
50,0.2337,0.23019,0.913963,0.867449
75,0.1419,0.234843,0.923836,0.86458
100,0.1318,0.222197,0.928068,0.886214
125,0.0835,0.260847,0.913963,0.860863
150,0.1016,0.29731,0.926657,0.877547
175,0.0544,0.274842,0.926657,0.885523
200,0.0375,0.314237,0.919605,0.877397
225,0.0456,0.396904,0.899859,0.855769
250,0.0214,0.324296,0.923836,0.880488


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3942,0.237306,0.912553,0.839123
50,0.2337,0.23019,0.913963,0.867449
75,0.1419,0.234843,0.923836,0.86458
100,0.1318,0.222197,0.928068,0.886214
125,0.0835,0.260847,0.913963,0.860863
150,0.1016,0.29731,0.926657,0.877547
175,0.0544,0.274842,0.926657,0.885523
200,0.0375,0.314237,0.919605,0.877397
225,0.0456,0.396904,0.899859,0.855769
250,0.0214,0.324296,0.923836,0.880488


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3942,0.237306,0.912553,0.839123
50,0.2337,0.23019,0.913963,0.867449
75,0.1419,0.234843,0.923836,0.86458
100,0.1318,0.222197,0.928068,0.886214
125,0.0835,0.260847,0.913963,0.860863
150,0.1016,0.29731,0.926657,0.877547
175,0.0544,0.274842,0.926657,0.885523
200,0.0375,0.314237,0.919605,0.877397
225,0.0456,0.396904,0.899859,0.855769
250,0.0214,0.324296,0.923836,0.880488


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3339,0.229832,0.922426,0.859733
50,0.2199,0.206305,0.922426,0.854727
75,0.1274,0.253374,0.928068,0.869934
100,0.1181,0.192117,0.929478,0.886906
125,0.0593,0.240309,0.93653,0.888982
150,0.0337,0.263788,0.933709,0.8903
175,0.0325,0.25616,0.93512,0.892318
200,0.0174,0.31473,0.929478,0.887529
225,0.0048,0.348402,0.93512,0.8876
250,0.0107,0.391387,0.929478,0.888746


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3339,0.229832,0.922426,0.859733
50,0.2199,0.206305,0.922426,0.854727
75,0.1274,0.253374,0.928068,0.869934
100,0.1181,0.192117,0.929478,0.886906
125,0.0593,0.240309,0.93653,0.888982
150,0.0337,0.263788,0.933709,0.8903
175,0.0325,0.25616,0.93512,0.892318
200,0.0174,0.31473,0.929478,0.887529
225,0.0048,0.348402,0.93512,0.8876
250,0.0107,0.391387,0.929478,0.888746


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3339,0.229832,0.922426,0.859733
50,0.2199,0.206305,0.922426,0.854727
75,0.1274,0.253374,0.928068,0.869934
100,0.1181,0.192117,0.929478,0.886906
125,0.0593,0.240309,0.93653,0.888982
150,0.0337,0.263788,0.933709,0.8903
175,0.0325,0.25616,0.93512,0.892318
200,0.0174,0.31473,0.929478,0.887529
225,0.0048,0.348402,0.93512,0.8876
250,0.0107,0.391387,0.929478,0.888746


DatasetDict({
    train: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 2833
    })
    test: Dataset({
        features: ['text', 'label', '__index_level_0__'],
        num_rows: 709
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3713,0.281799,0.899859,0.833302
50,0.2635,0.303905,0.906911,0.83873
75,0.1686,0.290394,0.897038,0.839714
100,0.1271,0.345174,0.897038,0.833492
125,0.0671,0.427737,0.898449,0.841493
150,0.0401,0.453815,0.909732,0.856822
175,0.0355,0.571351,0.892807,0.832687
200,0.0151,0.601775,0.90268,0.838951
225,0.031,0.551356,0.898449,0.845523
250,0.0168,0.55331,0.90409,0.837928


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3713,0.281799,0.899859,0.833302
50,0.2635,0.303905,0.906911,0.83873
75,0.1686,0.290394,0.897038,0.839714
100,0.1271,0.345174,0.897038,0.833492
125,0.0671,0.427737,0.898449,0.841493
150,0.0401,0.453815,0.909732,0.856822
175,0.0355,0.571351,0.892807,0.832687
200,0.0151,0.601775,0.90268,0.838951
225,0.031,0.551356,0.898449,0.845523
250,0.0168,0.55331,0.90409,0.837928


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3713,0.281799,0.899859,0.833302
50,0.2635,0.303905,0.906911,0.83873
75,0.1686,0.290394,0.897038,0.839714
100,0.1271,0.345174,0.897038,0.833492
125,0.0671,0.427737,0.898449,0.841493
150,0.0401,0.453815,0.909732,0.856822
175,0.0355,0.571351,0.892807,0.832687
200,0.0151,0.601775,0.90268,0.838951
225,0.031,0.551356,0.898449,0.845523
250,0.0168,0.55331,0.90409,0.837928


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3648,0.291657,0.897038,0.815086
50,0.2518,0.293498,0.909732,0.838428
75,0.2164,0.284016,0.911142,0.843562
100,0.1421,0.423001,0.864598,0.807976
125,0.0852,0.361272,0.915374,0.859545
150,0.1012,0.68888,0.832158,0.773853
175,0.0638,0.40977,0.919605,0.854632
200,0.039,0.712389,0.846262,0.789572
225,0.0245,0.518629,0.909732,0.848383
250,0.0118,0.559148,0.90268,0.839889


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3648,0.291657,0.897038,0.815086
50,0.2518,0.293498,0.909732,0.838428
75,0.2164,0.284016,0.911142,0.843562
100,0.1421,0.423001,0.864598,0.807976
125,0.0852,0.361272,0.915374,0.859545
150,0.1012,0.68888,0.832158,0.773853
175,0.0638,0.40977,0.919605,0.854632
200,0.039,0.712389,0.846262,0.789572
225,0.0245,0.518629,0.909732,0.848383
250,0.0118,0.559148,0.90268,0.839889


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3648,0.291657,0.897038,0.815086
50,0.2518,0.293498,0.909732,0.838428
75,0.2164,0.284016,0.911142,0.843562
100,0.1421,0.423001,0.864598,0.807976
125,0.0852,0.361272,0.915374,0.859545
150,0.1012,0.68888,0.832158,0.773853
175,0.0638,0.40977,0.919605,0.854632
200,0.039,0.712389,0.846262,0.789572
225,0.0245,0.518629,0.909732,0.848383
250,0.0118,0.559148,0.90268,0.839889


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3712,0.283534,0.894217,0.800458
50,0.257,0.278784,0.892807,0.823132
75,0.1478,0.275605,0.905501,0.839823
100,0.1264,0.593856,0.816643,0.762301
125,0.1214,0.399441,0.912553,0.834441
150,0.0816,0.361694,0.901269,0.838968
175,0.0373,0.397626,0.90409,0.83592
200,0.0096,0.624408,0.897038,0.828606
225,0.0243,0.580318,0.898449,0.831454
250,0.0018,0.603306,0.901269,0.83516


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3712,0.283534,0.894217,0.800458
50,0.257,0.278784,0.892807,0.823132
75,0.1478,0.275605,0.905501,0.839823
100,0.1264,0.593856,0.816643,0.762301
125,0.1214,0.399441,0.912553,0.834441
150,0.0816,0.361694,0.901269,0.838968
175,0.0373,0.397626,0.90409,0.83592
200,0.0096,0.624408,0.897038,0.828606
225,0.0243,0.580318,0.898449,0.831454
250,0.0018,0.603306,0.901269,0.83516


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/2833 [00:00<?, ? examples/s]

Map:   0%|          | 0/709 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
25,0.3712,0.283534,0.894217,0.800458
50,0.257,0.278784,0.892807,0.823132
75,0.1478,0.275605,0.905501,0.839823
100,0.1264,0.593856,0.816643,0.762301
125,0.1214,0.399441,0.912553,0.834441
150,0.0816,0.361694,0.901269,0.838968
175,0.0373,0.397626,0.90409,0.83592
200,0.0096,0.624408,0.897038,0.828606
225,0.0243,0.580318,0.898449,0.831454
250,0.0018,0.603306,0.901269,0.83516


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.922426,0.871628
3,SI2M-Lab/DarijaBERT-arabizi,0.915374,0.859545
6,SI2M-Lab/DarijaBERT-mix,0.93653,0.900671
9,UBC-NLP/MARBERT,0.926657,0.875301
12,UBC-NLP/MARBERTv2,0.937941,0.898196
15,aubmindlab/bert-base-arabertv02-twitter,0.939351,0.896565
21,qarib/bert-base-qarib,0.93653,0.893072
