In [2]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'dreviews_tc_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


dataset = load_dataset('ohidaoui/darija-reviews')


df = pd.DataFrame(dataset['test'])

display(len(df))
      
display(df.columns)
display(df[:4])

df['label'] = df['label'].replace('negative ', 'negative')

c = df['topic'].value_counts()
display(c)

classes = set(df['topic'].values)
display(classes)

df['topic'] = df['topic'].astype('category')
df['label'] = df['topic'].cat.codes

df = df[['review', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))



max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]

seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['review'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 30
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 10, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 10
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



Found cached dataset parquet (/home/ffq/.cache/huggingface/datasets/ohidaoui___parquet/ohidaoui--darija-reviews-34030453886e5230/0.0.0/14a00e99c0d15a23649d0db8944380ac81082d4b021f398733dd84f3a6c569a7)


  0%|          | 0/1 [00:00<?, ?it/s]

851

Index(['review', 'label', 'topic', 'writing_style'], dtype='object')

Unnamed: 0,review,label,topic,writing_style
0,داسيا فقدت أهم ميزة كانت تميزها وهي السعر للأسف !,negative,automotive,Arabic
1,لاأظنها ستنجح كالنسخ الأولى,negative,automotive,Arabic
2,Khas ykon tghyir mbanch li lfar9 rir fa dizayn lkrasa mikanik tablo fih dak lblstik lmryat 3lach mdyrinch lhm daw volm mzl kif mahwa jwant kifma howa fin kyn lfr9 fdizyn ama ljiti tchof mkynch fra9 fra9 howa y9riban 40% mli kt9ol l3mrya hdi bnsba li ana nas 3morya ama l3morya kolchi daw mzl khsha whd 10 ans wnchofo ana knfdl dacia l9dima,negative,automotive,Arabizi
3,هناك اختيارات أحسن وماركات عالميه أجود من داصيا.,negative,automotive,Arabic


topic
it                      287
cosmetics               172
entertainment           121
clothing                 93
cleaning                 57
hospitality              37
household appliances     33
automotive               20
restaurants              19
jewelry                   8
other                     4
Name: count, dtype: int64

{'automotive',
 'cleaning',
 'clothing',
 'cosmetics',
 'entertainment',
 'hospitality',
 'household appliances',
 'it',
 'jewelry',
 'other',
 'restaurants'}

11

851

DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8986,1.595783,0.497076,0.217005
20,1.3157,1.248549,0.631579,0.367401
30,0.9871,1.053109,0.649123,0.38316
40,0.7967,0.967388,0.666667,0.436717
50,0.6221,0.922083,0.701754,0.539588
60,0.4353,0.904201,0.707602,0.57489
70,0.3488,0.920319,0.719298,0.585627
80,0.2945,1.141648,0.707602,0.550054
90,0.2789,0.956942,0.730994,0.619259
100,0.2153,0.939259,0.719298,0.572987


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8623,1.580484,0.526316,0.219239
20,1.3439,1.271077,0.631579,0.368891
30,1.0369,1.056322,0.643275,0.373912
40,0.7938,0.983507,0.666667,0.4606
50,0.6423,0.901179,0.701754,0.460227
60,0.4565,0.902529,0.719298,0.597208
70,0.3599,0.866693,0.736842,0.621025
80,0.2911,1.065517,0.701754,0.565184
90,0.2403,0.886938,0.730994,0.580374
100,0.1842,0.92336,0.725146,0.587115


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8623,1.580484,0.526316,0.219239
20,1.3439,1.271077,0.631579,0.368891
30,1.0369,1.056322,0.643275,0.373912
40,0.7938,0.983507,0.666667,0.4606
50,0.6423,0.901179,0.701754,0.460227
60,0.4565,0.902529,0.719298,0.597208
70,0.3599,0.866693,0.736842,0.621025
80,0.2911,1.065517,0.701754,0.565184
90,0.2403,0.886938,0.730994,0.580374
100,0.1842,0.92336,0.725146,0.587115


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9107,1.644865,0.48538,0.163795
20,1.4609,1.307651,0.614035,0.285723
30,1.0168,1.149408,0.654971,0.302066
40,0.8522,0.99602,0.695906,0.380444
50,0.6081,0.931421,0.730994,0.412785
60,0.4681,0.981732,0.707602,0.410823
70,0.4036,1.019917,0.71345,0.440704
80,0.2992,0.895752,0.736842,0.48519
90,0.2151,1.028632,0.725146,0.462721
100,0.1726,1.120835,0.707602,0.478111


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9107,1.644865,0.48538,0.163795
20,1.4609,1.307651,0.614035,0.285723
30,1.0168,1.149408,0.654971,0.302066
40,0.8522,0.99602,0.695906,0.380444
50,0.6081,0.931421,0.730994,0.412785
60,0.4681,0.981732,0.707602,0.410823
70,0.4036,1.019917,0.71345,0.440704
80,0.2992,0.895752,0.736842,0.48519
90,0.2151,1.028632,0.725146,0.462721
100,0.1726,1.120835,0.707602,0.478111


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9107,1.644865,0.48538,0.163795
20,1.4609,1.307651,0.614035,0.285723
30,1.0168,1.149408,0.654971,0.302066
40,0.8522,0.99602,0.695906,0.380444
50,0.6081,0.931421,0.730994,0.412785
60,0.4681,0.981732,0.707602,0.410823
70,0.4036,1.019917,0.71345,0.440704
80,0.2992,0.895752,0.736842,0.48519
90,0.2151,1.028632,0.725146,0.462721
100,0.1726,1.120835,0.707602,0.478111


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8572,1.577049,0.467836,0.199085
20,1.3672,1.263199,0.619883,0.373595
30,1.1248,1.03025,0.725146,0.478281
40,0.894,0.946544,0.707602,0.501001
50,0.6583,0.844273,0.736842,0.543647
60,0.5053,0.799913,0.766082,0.597057
70,0.4157,0.843935,0.736842,0.573918
80,0.3391,0.783372,0.754386,0.648086
90,0.2209,0.870069,0.74269,0.649842
100,0.1957,0.966106,0.736842,0.656639


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8572,1.577049,0.467836,0.199085
20,1.3672,1.263199,0.619883,0.373595
30,1.1248,1.03025,0.725146,0.478281
40,0.894,0.946544,0.707602,0.501001
50,0.6583,0.844273,0.736842,0.543647
60,0.5053,0.799913,0.766082,0.597057
70,0.4157,0.843935,0.736842,0.573918
80,0.3391,0.783372,0.754386,0.648086
90,0.2209,0.870069,0.74269,0.649842
100,0.1957,0.966106,0.736842,0.656639


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8572,1.577049,0.467836,0.199085
20,1.3672,1.263199,0.619883,0.373595
30,1.1248,1.03025,0.725146,0.478281
40,0.894,0.946544,0.707602,0.501001
50,0.6583,0.844273,0.736842,0.543647
60,0.5053,0.799913,0.766082,0.597057
70,0.4157,0.843935,0.736842,0.573918
80,0.3391,0.783372,0.754386,0.648086
90,0.2209,0.870069,0.74269,0.649842
100,0.1957,0.966106,0.736842,0.656639


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9802,1.824761,0.362573,0.109098
20,1.5922,1.652565,0.467836,0.226789
30,1.2772,1.401314,0.549708,0.302174
40,0.9486,1.253666,0.631579,0.430101
50,0.6555,1.290158,0.614035,0.451809
60,0.554,1.344898,0.608187,0.434096
70,0.4571,1.285186,0.654971,0.467373
80,0.3525,1.366167,0.649123,0.517185
90,0.3295,1.275169,0.654971,0.497885
100,0.2351,1.361158,0.654971,0.519837


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9802,1.824761,0.362573,0.109098
20,1.5922,1.652565,0.467836,0.226789
30,1.2772,1.401314,0.549708,0.302174
40,0.9486,1.253666,0.631579,0.430101
50,0.6555,1.290158,0.614035,0.451809
60,0.554,1.344898,0.608187,0.434096
70,0.4571,1.285186,0.654971,0.467373
80,0.3525,1.366167,0.649123,0.517185
90,0.3295,1.275169,0.654971,0.497885
100,0.2351,1.361158,0.654971,0.519837


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9802,1.824761,0.362573,0.109098
20,1.5922,1.652565,0.467836,0.226789
30,1.2772,1.401314,0.549708,0.302174
40,0.9486,1.253666,0.631579,0.430101
50,0.6555,1.290158,0.614035,0.451809
60,0.554,1.344898,0.608187,0.434096
70,0.4571,1.285186,0.654971,0.467373
80,0.3525,1.366167,0.649123,0.517185
90,0.3295,1.275169,0.654971,0.497885
100,0.2351,1.361158,0.654971,0.519837


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0174,1.76484,0.497076,0.141341
20,1.667,1.518256,0.54386,0.194228
30,1.2502,1.343667,0.590643,0.246173
40,0.9479,1.344067,0.596491,0.291446
50,0.6842,1.329165,0.614035,0.377994
60,0.6464,1.231997,0.643275,0.350538
70,0.5136,1.20221,0.684211,0.403962
80,0.345,1.336012,0.625731,0.350788
90,0.3173,1.237446,0.672515,0.421623
100,0.2589,1.255185,0.666667,0.470853


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0174,1.76484,0.497076,0.141341
20,1.667,1.518256,0.54386,0.194228
30,1.2502,1.343667,0.590643,0.246173
40,0.9479,1.344067,0.596491,0.291446
50,0.6842,1.329165,0.614035,0.377994
60,0.6464,1.231997,0.643275,0.350538
70,0.5136,1.20221,0.684211,0.403962
80,0.345,1.336012,0.625731,0.350788
90,0.3173,1.237446,0.672515,0.421623
100,0.2589,1.255185,0.666667,0.470853


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0174,1.76484,0.497076,0.141341
20,1.667,1.518256,0.54386,0.194228
30,1.2502,1.343667,0.590643,0.246173
40,0.9479,1.344067,0.596491,0.291446
50,0.6842,1.329165,0.614035,0.377994
60,0.6464,1.231997,0.643275,0.350538
70,0.5136,1.20221,0.684211,0.403962
80,0.345,1.336012,0.625731,0.350788
90,0.3173,1.237446,0.672515,0.421623
100,0.2589,1.255185,0.666667,0.470853


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0069,1.849806,0.315789,0.090254
20,1.6393,1.668671,0.432749,0.185542
30,1.3703,1.430328,0.532164,0.270258
40,1.0866,1.302266,0.596491,0.401245
50,0.745,1.21752,0.643275,0.50544
60,0.5935,1.276849,0.625731,0.461225
70,0.4821,1.262485,0.619883,0.48816
80,0.4175,1.326384,0.614035,0.459905
90,0.2621,1.294476,0.625731,0.483104
100,0.307,1.476246,0.637427,0.470364


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0069,1.849806,0.315789,0.090254
20,1.6393,1.668671,0.432749,0.185542
30,1.3703,1.430328,0.532164,0.270258
40,1.0866,1.302266,0.596491,0.401245
50,0.745,1.21752,0.643275,0.50544
60,0.5935,1.276849,0.625731,0.461225
70,0.4821,1.262485,0.619883,0.48816
80,0.4175,1.326384,0.614035,0.459905
90,0.2621,1.294476,0.625731,0.483104
100,0.307,1.476246,0.637427,0.470364


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0069,1.849806,0.315789,0.090254
20,1.6393,1.668671,0.432749,0.185542
30,1.3703,1.430328,0.532164,0.270258
40,1.0866,1.302266,0.596491,0.401245
50,0.745,1.21752,0.643275,0.50544
60,0.5935,1.276849,0.625731,0.461225
70,0.4821,1.262485,0.619883,0.48816
80,0.4175,1.326384,0.614035,0.459905
90,0.2621,1.294476,0.625731,0.483104
100,0.307,1.476246,0.637427,0.470364


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9862,1.656892,0.45614,0.181422
20,1.3884,1.23509,0.602339,0.292345
30,0.986,0.980735,0.666667,0.415037
40,0.6573,0.954427,0.71345,0.539114
50,0.49,0.9771,0.719298,0.60221
60,0.333,1.071084,0.71345,0.550519
70,0.2498,0.999031,0.736842,0.596637
80,0.1675,1.14473,0.707602,0.541795
90,0.1161,1.077477,0.736842,0.599204
100,0.0781,1.325983,0.672515,0.480354


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9862,1.656892,0.45614,0.181422
20,1.3884,1.23509,0.602339,0.292345
30,0.986,0.980735,0.666667,0.415037
40,0.6573,0.954427,0.71345,0.539114
50,0.49,0.9771,0.719298,0.60221
60,0.333,1.071084,0.71345,0.550519
70,0.2498,0.999031,0.736842,0.596637
80,0.1675,1.14473,0.707602,0.541795
90,0.1161,1.077477,0.736842,0.599204
100,0.0781,1.325983,0.672515,0.480354


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9862,1.656892,0.45614,0.181422
20,1.3884,1.23509,0.602339,0.292345
30,0.986,0.980735,0.666667,0.415037
40,0.6573,0.954427,0.71345,0.539114
50,0.49,0.9771,0.719298,0.60221
60,0.333,1.071084,0.71345,0.550519
70,0.2498,0.999031,0.736842,0.596637
80,0.1675,1.14473,0.707602,0.541795
90,0.1161,1.077477,0.736842,0.599204
100,0.0781,1.325983,0.672515,0.480354


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0008,1.661804,0.497076,0.157021
20,1.4639,1.29026,0.596491,0.227192
30,0.9403,1.0559,0.701754,0.348379
40,0.7026,1.191369,0.672515,0.378146
50,0.4425,1.161135,0.660819,0.404198
60,0.3413,1.104459,0.695906,0.446178
70,0.2599,1.128805,0.672515,0.412495
80,0.156,1.281456,0.660819,0.475467
90,0.1202,1.180681,0.701754,0.465555
100,0.1173,1.397053,0.666667,0.483661


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0008,1.661804,0.497076,0.157021
20,1.4639,1.29026,0.596491,0.227192
30,0.9403,1.0559,0.701754,0.348379
40,0.7026,1.191369,0.672515,0.378146
50,0.4425,1.161135,0.660819,0.404198
60,0.3413,1.104459,0.695906,0.446178
70,0.2599,1.128805,0.672515,0.412495
80,0.156,1.281456,0.660819,0.475467
90,0.1202,1.180681,0.701754,0.465555
100,0.1173,1.397053,0.666667,0.483661


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0008,1.661804,0.497076,0.157021
20,1.4639,1.29026,0.596491,0.227192
30,0.9403,1.0559,0.701754,0.348379
40,0.7026,1.191369,0.672515,0.378146
50,0.4425,1.161135,0.660819,0.404198
60,0.3413,1.104459,0.695906,0.446178
70,0.2599,1.128805,0.672515,0.412495
80,0.156,1.281456,0.660819,0.475467
90,0.1202,1.180681,0.701754,0.465555
100,0.1173,1.397053,0.666667,0.483661


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9729,1.750437,0.426901,0.161803
20,1.4481,1.274138,0.584795,0.275038
30,1.0906,1.006394,0.690058,0.40625
40,0.7928,0.929305,0.707602,0.490631
50,0.5051,0.904589,0.736842,0.585018
60,0.3615,0.973274,0.730994,0.636746
70,0.2711,1.007032,0.730994,0.663714
80,0.2149,1.017832,0.736842,0.541622
90,0.148,1.092841,0.695906,0.495096
100,0.1046,1.078215,0.730994,0.56813


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9729,1.750437,0.426901,0.161803
20,1.4481,1.274138,0.584795,0.275038
30,1.0906,1.006394,0.690058,0.40625
40,0.7928,0.929305,0.707602,0.490631
50,0.5051,0.904589,0.736842,0.585018
60,0.3615,0.973274,0.730994,0.636746
70,0.2711,1.007032,0.730994,0.663714
80,0.2149,1.017832,0.736842,0.541622
90,0.148,1.092841,0.695906,0.495096
100,0.1046,1.078215,0.730994,0.56813


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9729,1.750437,0.426901,0.161803
20,1.4481,1.274138,0.584795,0.275038
30,1.0906,1.006394,0.690058,0.40625
40,0.7928,0.929305,0.707602,0.490631
50,0.5051,0.904589,0.736842,0.585018
60,0.3615,0.973274,0.730994,0.636746
70,0.2711,1.007032,0.730994,0.663714
80,0.2149,1.017832,0.736842,0.541622
90,0.148,1.092841,0.695906,0.495096
100,0.1046,1.078215,0.730994,0.56813


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0436,1.821072,0.327485,0.097003
20,1.6241,1.501843,0.51462,0.238952
30,1.2451,1.171639,0.654971,0.381787
40,0.9128,1.024301,0.695906,0.436332
50,0.6871,0.96013,0.725146,0.508187
60,0.535,0.9842,0.725146,0.538731
70,0.4148,1.023198,0.725146,0.553099
80,0.3429,1.070666,0.725146,0.614723
90,0.2377,1.171353,0.725146,0.585699
100,0.171,1.135015,0.725146,0.599409


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0436,1.821072,0.327485,0.097003
20,1.6241,1.501843,0.51462,0.238952
30,1.2451,1.171639,0.654971,0.381787
40,0.9128,1.024301,0.695906,0.436332
50,0.6871,0.96013,0.725146,0.508187
60,0.535,0.9842,0.725146,0.538731
70,0.4148,1.023198,0.725146,0.553099
80,0.3429,1.070666,0.725146,0.614723
90,0.2377,1.171353,0.725146,0.585699
100,0.171,1.135015,0.725146,0.599409


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0436,1.821072,0.327485,0.097003
20,1.6241,1.501843,0.51462,0.238952
30,1.2451,1.171639,0.654971,0.381787
40,0.9128,1.024301,0.695906,0.436332
50,0.6871,0.96013,0.725146,0.508187
60,0.535,0.9842,0.725146,0.538731
70,0.4148,1.023198,0.725146,0.553099
80,0.3429,1.070666,0.725146,0.614723
90,0.2377,1.171353,0.725146,0.585699
100,0.171,1.135015,0.725146,0.599409


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0676,1.7539,0.479532,0.108767
20,1.6726,1.545691,0.526316,0.166104
30,1.1929,1.39717,0.625731,0.299631
40,0.9738,1.341416,0.614035,0.30639
50,0.6825,1.42994,0.608187,0.312177
60,0.5501,1.384874,0.631579,0.33789
70,0.4847,1.383788,0.596491,0.336252
80,0.4035,1.536427,0.614035,0.41007
90,0.297,1.378198,0.649123,0.407703
100,0.2761,1.444343,0.637427,0.422749


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0676,1.7539,0.479532,0.108767
20,1.6726,1.545691,0.526316,0.166104
30,1.1929,1.39717,0.625731,0.299631
40,0.9738,1.341416,0.614035,0.30639
50,0.6825,1.42994,0.608187,0.312177
60,0.5501,1.384874,0.631579,0.33789
70,0.4847,1.383788,0.596491,0.336252
80,0.4035,1.536427,0.614035,0.41007
90,0.297,1.378198,0.649123,0.407703
100,0.2761,1.444343,0.637427,0.422749


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0676,1.7539,0.479532,0.108767
20,1.6726,1.545691,0.526316,0.166104
30,1.1929,1.39717,0.625731,0.299631
40,0.9738,1.341416,0.614035,0.30639
50,0.6825,1.42994,0.608187,0.312177
60,0.5501,1.384874,0.631579,0.33789
70,0.4847,1.383788,0.596491,0.336252
80,0.4035,1.536427,0.614035,0.41007
90,0.297,1.378198,0.649123,0.407703
100,0.2761,1.444343,0.637427,0.422749


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0454,1.865023,0.345029,0.100584
20,1.6222,1.436085,0.555556,0.281258
30,1.2955,1.2233,0.625731,0.371222
40,1.0191,1.126916,0.666667,0.389834
50,0.7241,1.077603,0.684211,0.430968
60,0.545,1.123336,0.678363,0.496677
70,0.4102,1.142688,0.695906,0.505135
80,0.3467,1.066939,0.684211,0.528906
90,0.2502,1.187692,0.719298,0.538739
100,0.2163,1.166268,0.71345,0.59966


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0454,1.865023,0.345029,0.100584
20,1.6222,1.436085,0.555556,0.281258
30,1.2955,1.2233,0.625731,0.371222
40,1.0191,1.126916,0.666667,0.389834
50,0.7241,1.077603,0.684211,0.430968
60,0.545,1.123336,0.678363,0.496677
70,0.4102,1.142688,0.695906,0.505135
80,0.3467,1.066939,0.684211,0.528906
90,0.2502,1.187692,0.719298,0.538739
100,0.2163,1.166268,0.71345,0.59966


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0454,1.865023,0.345029,0.100584
20,1.6222,1.436085,0.555556,0.281258
30,1.2955,1.2233,0.625731,0.371222
40,1.0191,1.126916,0.666667,0.389834
50,0.7241,1.077603,0.684211,0.430968
60,0.545,1.123336,0.678363,0.496677
70,0.4102,1.142688,0.695906,0.505135
80,0.3467,1.066939,0.684211,0.528906
90,0.2502,1.187692,0.719298,0.538739
100,0.2163,1.166268,0.71345,0.59966


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.1338,1.933003,0.356725,0.105656
20,1.7422,1.609011,0.520468,0.212019
30,1.3942,1.366861,0.602339,0.291127
40,1.1205,1.215499,0.660819,0.385621
50,0.904,1.105577,0.690058,0.412327
60,0.7813,1.066198,0.71345,0.426242
70,0.5916,1.028274,0.719298,0.459478
80,0.5487,0.995557,0.719298,0.467488
90,0.4342,0.979576,0.725146,0.502449
100,0.3491,0.997021,0.719298,0.495396


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.1338,1.933003,0.356725,0.105656
20,1.7422,1.609011,0.520468,0.212019
30,1.3942,1.366861,0.602339,0.291127
40,1.1205,1.215499,0.660819,0.385621
50,0.904,1.105577,0.690058,0.412327
60,0.7813,1.066198,0.71345,0.426242
70,0.5916,1.028274,0.719298,0.459478
80,0.5487,0.995557,0.719298,0.467488
90,0.4342,0.979576,0.725146,0.502449
100,0.3491,0.997021,0.719298,0.495396


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.1338,1.933003,0.356725,0.105656
20,1.7422,1.609011,0.520468,0.212019
30,1.3942,1.366861,0.602339,0.291127
40,1.1205,1.215499,0.660819,0.385621
50,0.904,1.105577,0.690058,0.412327
60,0.7813,1.066198,0.71345,0.426242
70,0.5916,1.028274,0.719298,0.459478
80,0.5487,0.995557,0.719298,0.467488
90,0.4342,0.979576,0.725146,0.502449
100,0.3491,0.997021,0.719298,0.495396


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.146,1.855526,0.45614,0.103831
20,1.8148,1.584972,0.54386,0.169312
30,1.4287,1.320138,0.590643,0.203843
40,1.1661,1.222748,0.672515,0.315146
50,0.8803,1.1826,0.672515,0.325279
60,0.7215,1.121646,0.684211,0.33692
70,0.6176,1.208593,0.654971,0.345106
80,0.5032,1.210427,0.678363,0.361625
90,0.43,1.099245,0.725146,0.376219
100,0.3998,1.204671,0.666667,0.396722


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.146,1.855526,0.45614,0.103831
20,1.8148,1.584972,0.54386,0.169312
30,1.4287,1.320138,0.590643,0.203843
40,1.1661,1.222748,0.672515,0.315146
50,0.8803,1.1826,0.672515,0.325279
60,0.7215,1.121646,0.684211,0.33692
70,0.6176,1.208593,0.654971,0.345106
80,0.5032,1.210427,0.678363,0.361625
90,0.43,1.099245,0.725146,0.376219
100,0.3998,1.204671,0.666667,0.396722


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.146,1.855526,0.45614,0.103831
20,1.8148,1.584972,0.54386,0.169312
30,1.4287,1.320138,0.590643,0.203843
40,1.1661,1.222748,0.672515,0.315146
50,0.8803,1.1826,0.672515,0.325279
60,0.7215,1.121646,0.684211,0.33692
70,0.6176,1.208593,0.654971,0.345106
80,0.5032,1.210427,0.678363,0.361625
90,0.43,1.099245,0.725146,0.376219
100,0.3998,1.204671,0.666667,0.396722


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.128,1.917812,0.350877,0.098138
20,1.7558,1.628901,0.51462,0.214315
30,1.477,1.380951,0.555556,0.254897
40,1.2254,1.281203,0.608187,0.354187
50,0.9689,1.195964,0.654971,0.402965
60,0.8368,1.158558,0.649123,0.385009
70,0.6757,1.129007,0.666667,0.420085
80,0.6186,1.117579,0.666667,0.411402
90,0.4818,1.11871,0.672515,0.436472
100,0.4437,1.096248,0.701754,0.485678


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.128,1.917812,0.350877,0.098138
20,1.7558,1.628901,0.51462,0.214315
30,1.477,1.380951,0.555556,0.254897
40,1.2254,1.281203,0.608187,0.354187
50,0.9689,1.195964,0.654971,0.402965
60,0.8368,1.158558,0.649123,0.385009
70,0.6757,1.129007,0.666667,0.420085
80,0.6186,1.117579,0.666667,0.411402
90,0.4818,1.11871,0.672515,0.436472
100,0.4437,1.096248,0.701754,0.485678


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.128,1.917812,0.350877,0.098138
20,1.7558,1.628901,0.51462,0.214315
30,1.477,1.380951,0.555556,0.254897
40,1.2254,1.281203,0.608187,0.354187
50,0.9689,1.195964,0.654971,0.402965
60,0.8368,1.158558,0.649123,0.385009
70,0.6757,1.129007,0.666667,0.420085
80,0.6186,1.117579,0.666667,0.411402
90,0.4818,1.11871,0.672515,0.436472
100,0.4437,1.096248,0.701754,0.485678


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9791,1.79997,0.426901,0.12744
20,1.6189,1.73242,0.432749,0.142484
30,1.5168,1.417773,0.573099,0.284404
40,1.2134,1.23312,0.619883,0.316401
50,1.0324,1.059869,0.666667,0.376866
60,0.8605,0.890038,0.719298,0.419604
70,0.7397,0.82674,0.77193,0.528494
80,0.6919,0.844555,0.748538,0.505834
90,0.5667,0.787214,0.777778,0.584156
100,0.4575,0.798807,0.754386,0.528177


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9791,1.79997,0.426901,0.12744
20,1.6189,1.73242,0.432749,0.142484
30,1.5168,1.417773,0.573099,0.284404
40,1.2134,1.23312,0.619883,0.316401
50,1.0324,1.059869,0.666667,0.376866
60,0.8605,0.890038,0.719298,0.419604
70,0.7397,0.82674,0.77193,0.528494
80,0.6919,0.844555,0.748538,0.505834
90,0.5667,0.787214,0.777778,0.584156
100,0.4575,0.798807,0.754386,0.528177


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9791,1.79997,0.426901,0.12744
20,1.6189,1.73242,0.432749,0.142484
30,1.5168,1.417773,0.573099,0.284404
40,1.2134,1.23312,0.619883,0.316401
50,1.0324,1.059869,0.666667,0.376866
60,0.8605,0.890038,0.719298,0.419604
70,0.7397,0.82674,0.77193,0.528494
80,0.6919,0.844555,0.748538,0.505834
90,0.5667,0.787214,0.777778,0.584156
100,0.4575,0.798807,0.754386,0.528177


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9918,1.70716,0.45614,0.150181
20,1.5362,1.232352,0.649123,0.240015
30,1.0548,0.936878,0.725146,0.338828
40,0.7725,0.871531,0.730994,0.382803
50,0.4981,0.752262,0.77193,0.442403
60,0.3747,0.761229,0.766082,0.458091
70,0.2721,0.758935,0.760234,0.456365
80,0.1597,0.749447,0.766082,0.478603
90,0.1014,0.838321,0.74269,0.504522
100,0.074,0.796868,0.795322,0.554796


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9918,1.70716,0.45614,0.150181
20,1.5362,1.232352,0.649123,0.240015
30,1.0548,0.936878,0.725146,0.338828
40,0.7725,0.871531,0.730994,0.382803
50,0.4981,0.752262,0.77193,0.442403
60,0.3747,0.761229,0.766082,0.458091
70,0.2721,0.758935,0.760234,0.456365
80,0.1597,0.749447,0.766082,0.478603
90,0.1014,0.838321,0.74269,0.504522
100,0.074,0.796868,0.795322,0.554796


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9918,1.70716,0.45614,0.150181
20,1.5362,1.232352,0.649123,0.240015
30,1.0548,0.936878,0.725146,0.338828
40,0.7725,0.871531,0.730994,0.382803
50,0.4981,0.752262,0.77193,0.442403
60,0.3747,0.761229,0.766082,0.458091
70,0.2721,0.758935,0.760234,0.456365
80,0.1597,0.749447,0.766082,0.478603
90,0.1014,0.838321,0.74269,0.504522
100,0.074,0.796868,0.795322,0.554796


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0403,1.891399,0.374269,0.104467
20,1.7297,1.656297,0.415205,0.155859
30,1.6078,1.4332,0.532164,0.250273
40,1.3535,1.169789,0.654971,0.325312
50,1.0751,1.005239,0.654971,0.37268
60,0.8756,0.873105,0.71345,0.475744
70,0.6773,0.797993,0.730994,0.519348
80,0.5584,0.678899,0.783626,0.539753
90,0.3741,0.703455,0.766082,0.545906
100,0.2885,0.708114,0.766082,0.626146


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0403,1.891399,0.374269,0.104467
20,1.7297,1.656297,0.415205,0.155859
30,1.6078,1.4332,0.532164,0.250273
40,1.3535,1.169789,0.654971,0.325312
50,1.0751,1.005239,0.654971,0.37268
60,0.8756,0.873105,0.71345,0.475744
70,0.6773,0.797993,0.730994,0.519348
80,0.5584,0.678899,0.783626,0.539753
90,0.3741,0.703455,0.766082,0.545906
100,0.2885,0.708114,0.766082,0.626146


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0403,1.891399,0.374269,0.104467
20,1.7297,1.656297,0.415205,0.155859
30,1.6078,1.4332,0.532164,0.250273
40,1.3535,1.169789,0.654971,0.325312
50,1.0751,1.005239,0.654971,0.37268
60,0.8756,0.873105,0.71345,0.475744
70,0.6773,0.797993,0.730994,0.519348
80,0.5584,0.678899,0.783626,0.539753
90,0.3741,0.703455,0.766082,0.545906
100,0.2885,0.708114,0.766082,0.626146


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9289,1.699166,0.426901,0.125683
20,1.3272,1.237683,0.602339,0.290754
30,0.9479,1.047257,0.678363,0.354413
40,0.6544,1.000452,0.690058,0.421439
50,0.4298,1.021266,0.695906,0.459212
60,0.2875,1.005385,0.707602,0.435858
70,0.2043,1.147761,0.690058,0.470291
80,0.1391,1.078785,0.707602,0.484352
90,0.0732,1.171998,0.701754,0.483882
100,0.0433,1.169872,0.690058,0.473997


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9289,1.699166,0.426901,0.125683
20,1.3272,1.237683,0.602339,0.290754
30,0.9479,1.047257,0.678363,0.354413
40,0.6544,1.000452,0.690058,0.421439
50,0.4298,1.021266,0.695906,0.459212
60,0.2875,1.005385,0.707602,0.435858
70,0.2043,1.147761,0.690058,0.470291
80,0.1391,1.078785,0.707602,0.484352
90,0.0732,1.171998,0.701754,0.483882
100,0.0433,1.169872,0.690058,0.473997


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9289,1.699166,0.426901,0.125683
20,1.3272,1.237683,0.602339,0.290754
30,0.9479,1.047257,0.678363,0.354413
40,0.6544,1.000452,0.690058,0.421439
50,0.4298,1.021266,0.695906,0.459212
60,0.2875,1.005385,0.707602,0.435858
70,0.2043,1.147761,0.690058,0.470291
80,0.1391,1.078785,0.707602,0.484352
90,0.0732,1.171998,0.701754,0.483882
100,0.0433,1.169872,0.690058,0.473997


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9578,1.680553,0.491228,0.160686
20,1.4345,1.299141,0.619883,0.222415
30,0.9236,1.092621,0.660819,0.251365
40,0.7175,1.07025,0.672515,0.297708
50,0.4217,1.027797,0.707602,0.347465
60,0.3112,1.04037,0.701754,0.371286
70,0.2076,1.178659,0.684211,0.353077
80,0.1432,1.123967,0.719298,0.408299
90,0.0774,1.203326,0.695906,0.42572
100,0.068,1.160943,0.707602,0.433552


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9578,1.680553,0.491228,0.160686
20,1.4345,1.299141,0.619883,0.222415
30,0.9236,1.092621,0.660819,0.251365
40,0.7175,1.07025,0.672515,0.297708
50,0.4217,1.027797,0.707602,0.347465
60,0.3112,1.04037,0.701754,0.371286
70,0.2076,1.178659,0.684211,0.353077
80,0.1432,1.123967,0.719298,0.408299
90,0.0774,1.203326,0.695906,0.42572
100,0.068,1.160943,0.707602,0.433552


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9578,1.680553,0.491228,0.160686
20,1.4345,1.299141,0.619883,0.222415
30,0.9236,1.092621,0.660819,0.251365
40,0.7175,1.07025,0.672515,0.297708
50,0.4217,1.027797,0.707602,0.347465
60,0.3112,1.04037,0.701754,0.371286
70,0.2076,1.178659,0.684211,0.353077
80,0.1432,1.123967,0.719298,0.408299
90,0.0774,1.203326,0.695906,0.42572
100,0.068,1.160943,0.707602,0.433552


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9418,1.673427,0.415205,0.120065
20,1.3578,1.250445,0.625731,0.30253
30,1.0088,1.050584,0.643275,0.327822
40,0.7341,0.980034,0.678363,0.37199
50,0.4649,0.997067,0.684211,0.472014
60,0.322,1.017674,0.695906,0.483196
70,0.1875,1.035465,0.707602,0.467732
80,0.15,1.040999,0.695906,0.487373
90,0.081,1.155118,0.707602,0.503795
100,0.054,1.221034,0.678363,0.465143


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9418,1.673427,0.415205,0.120065
20,1.3578,1.250445,0.625731,0.30253
30,1.0088,1.050584,0.643275,0.327822
40,0.7341,0.980034,0.678363,0.37199
50,0.4649,0.997067,0.684211,0.472014
60,0.322,1.017674,0.695906,0.483196
70,0.1875,1.035465,0.707602,0.467732
80,0.15,1.040999,0.695906,0.487373
90,0.081,1.155118,0.707602,0.503795
100,0.054,1.221034,0.678363,0.465143


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9418,1.673427,0.415205,0.120065
20,1.3578,1.250445,0.625731,0.30253
30,1.0088,1.050584,0.643275,0.327822
40,0.7341,0.980034,0.678363,0.37199
50,0.4649,0.997067,0.684211,0.472014
60,0.322,1.017674,0.695906,0.483196
70,0.1875,1.035465,0.707602,0.467732
80,0.15,1.040999,0.695906,0.487373
90,0.081,1.155118,0.707602,0.503795
100,0.054,1.221034,0.678363,0.465143


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.690058,0.569598
3,SI2M-Lab/DarijaBERT-arabizi,0.730994,0.552129
6,SI2M-Lab/DarijaBERT-mix,0.824561,0.758153
9,UBC-NLP/MARBERT,0.736842,0.630286
12,UBC-NLP/MARBERTv2,0.730994,0.643215
15,aubmindlab/bert-base-arabertv02-twitter,0.760234,0.694863
18,qarib/bert-base-qarib,0.730994,0.663714
