In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'dreviews_tc_2'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


dataset = load_dataset('ohidaoui/darija-reviews')


df = pd.DataFrame(dataset['test'])

display(len(df))
      
display(df.columns)
display(df[:4])

df['label'] = df['label'].replace('negative ', 'negative')

c = df['topic'].value_counts()
display(c)

classes = set(df['topic'].values)
display(classes)

df['topic'] = df['topic'].astype('category')
df['label'] = df['topic'].cat.codes

df = df[['review', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))



max_sequence_length = 128

models = [ 
        'faisalq/EgyBERT',            
    'faisalq/SaudiBERT',            
    'tunis-ai/TunBERT',
    'alger-ia/dziribert',
    'SI2M-Lab/DarijaBERT',
    'otmangi/MorRoBERTa',
    'otmangi/MorrBERT'
            
]


seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['review'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 30
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 10, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 10
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-19 08:14:33.348378: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-19 08:14:33.374453: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.
Found cached dataset parquet (/home/ffq/.cache/huggingface/datasets/ohidaoui___parquet/ohidaoui--darija-reviews-34030453886e5230/0.0.0/14a00e99c0d15a23649d0db8944380ac81082d4b021f398733dd84f3a6c569a7)


  0%|          | 0/1 [00:00<?, ?it/s]

851

Index(['review', 'label', 'topic', 'writing_style'], dtype='object')

Unnamed: 0,review,label,topic,writing_style
0,داسيا فقدت أهم ميزة كانت تميزها وهي السعر للأسف !,negative,automotive,Arabic
1,لاأظنها ستنجح كالنسخ الأولى,negative,automotive,Arabic
2,Khas ykon tghyir mbanch li lfar9 rir fa dizayn lkrasa mikanik tablo fih dak lblstik lmryat 3lach mdyrinch lhm daw volm mzl kif mahwa jwant kifma howa fin kyn lfr9 fdizyn ama ljiti tchof mkynch fra9 fra9 howa y9riban 40% mli kt9ol l3mrya hdi bnsba li ana nas 3morya ama l3morya kolchi daw mzl khsha whd 10 ans wnchofo ana knfdl dacia l9dima,negative,automotive,Arabizi
3,هناك اختيارات أحسن وماركات عالميه أجود من داصيا.,negative,automotive,Arabic


topic
it                      287
cosmetics               172
entertainment           121
clothing                 93
cleaning                 57
hospitality              37
household appliances     33
automotive               20
restaurants              19
jewelry                   8
other                     4
Name: count, dtype: int64

{'automotive',
 'cleaning',
 'clothing',
 'cosmetics',
 'entertainment',
 'hospitality',
 'household appliances',
 'it',
 'jewelry',
 'other',
 'restaurants'}

11

851

DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

faisalq/EgyBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.3865,2.356839,0.315789,0.053333
20,2.3299,2.302597,0.315789,0.053333
30,2.2735,2.247339,0.315789,0.053333
40,2.2129,2.190681,0.315789,0.053333
50,2.1418,2.129957,0.315789,0.053333
60,2.0931,2.062466,0.339181,0.080938
70,1.9702,1.997801,0.345029,0.085586
80,1.955,1.939727,0.438596,0.134863
90,1.8491,1.878672,0.444444,0.137375
100,1.7636,1.823985,0.444444,0.134867


faisalq/EgyBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.3785,2.349153,0.315789,0.053333
20,2.3198,2.293323,0.315789,0.053333
30,2.2602,2.238293,0.315789,0.053333
40,2.199,2.180835,0.315789,0.053333
50,2.1273,2.123355,0.315789,0.053333
60,2.0862,2.071563,0.385965,0.112683
70,1.9625,2.004363,0.415205,0.12548
80,1.9439,1.934142,0.426901,0.130435
90,1.8387,1.871642,0.438596,0.133625
100,1.749,1.827388,0.444444,0.13603


faisalq/EgyBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.3785,2.349153,0.315789,0.053333
20,2.3198,2.293323,0.315789,0.053333
30,2.2602,2.238293,0.315789,0.053333
40,2.199,2.180835,0.315789,0.053333
50,2.1273,2.123355,0.315789,0.053333
60,2.0862,2.071563,0.385965,0.112683
70,1.9625,2.004363,0.415205,0.12548
80,1.9439,1.934142,0.426901,0.130435
90,1.8387,1.871642,0.438596,0.133625
100,1.749,1.827388,0.444444,0.13603


faisalq/EgyBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.38,2.34206,0.397661,0.051731
20,2.3269,2.278989,0.397661,0.051731
30,2.2643,2.21465,0.397661,0.051731
40,2.2185,2.152698,0.397661,0.051731
50,2.1348,2.086971,0.397661,0.051731
60,2.0754,2.019508,0.473684,0.104692
70,2.0096,1.94883,0.508772,0.116689
80,1.9292,1.87267,0.51462,0.117252
90,1.8319,1.811706,0.502924,0.113625
100,1.7765,1.740714,0.51462,0.11678


faisalq/EgyBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.38,2.34206,0.397661,0.051731
20,2.3269,2.278989,0.397661,0.051731
30,2.2643,2.21465,0.397661,0.051731
40,2.2185,2.152698,0.397661,0.051731
50,2.1348,2.086971,0.397661,0.051731
60,2.0754,2.019508,0.473684,0.104692
70,2.0096,1.94883,0.508772,0.116689
80,1.9292,1.87267,0.51462,0.117252
90,1.8319,1.811706,0.502924,0.113625
100,1.7765,1.740714,0.51462,0.11678


faisalq/EgyBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.38,2.34206,0.397661,0.051731
20,2.3269,2.278989,0.397661,0.051731
30,2.2643,2.21465,0.397661,0.051731
40,2.2185,2.152698,0.397661,0.051731
50,2.1348,2.086971,0.397661,0.051731
60,2.0754,2.019508,0.473684,0.104692
70,2.0096,1.94883,0.508772,0.116689
80,1.9292,1.87267,0.51462,0.117252
90,1.8319,1.811706,0.502924,0.113625
100,1.7765,1.740714,0.51462,0.11678


faisalq/EgyBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.3793,2.349633,0.339181,0.073574
20,2.322,2.292717,0.321637,0.054081
30,2.2665,2.235117,0.321637,0.054081
40,2.2156,2.178677,0.321637,0.054081
50,2.1247,2.119032,0.321637,0.054081
60,2.0892,2.058411,0.350877,0.084555
70,1.9838,1.995854,0.374269,0.099577
80,1.9584,1.922143,0.438596,0.129898
90,1.8466,1.871305,0.426901,0.125392
100,1.7848,1.814859,0.438596,0.130244


faisalq/EgyBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.3793,2.349633,0.339181,0.073574
20,2.322,2.292717,0.321637,0.054081
30,2.2665,2.235117,0.321637,0.054081
40,2.2156,2.178677,0.321637,0.054081
50,2.1247,2.119032,0.321637,0.054081
60,2.0892,2.058411,0.350877,0.084555
70,1.9838,1.995854,0.374269,0.099577
80,1.9584,1.922143,0.438596,0.129898
90,1.8466,1.871305,0.426901,0.125392
100,1.7848,1.814859,0.438596,0.130244


faisalq/EgyBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.3793,2.349633,0.339181,0.073574
20,2.322,2.292717,0.321637,0.054081
30,2.2665,2.235117,0.321637,0.054081
40,2.2156,2.178677,0.321637,0.054081
50,2.1247,2.119032,0.321637,0.054081
60,2.0892,2.058411,0.350877,0.084555
70,1.9838,1.995854,0.374269,0.099577
80,1.9584,1.922143,0.438596,0.129898
90,1.8466,1.871305,0.426901,0.125392
100,1.7848,1.814859,0.438596,0.130244


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.797,1.456134,0.532164,0.232643
20,1.1702,1.115634,0.649123,0.367058
30,0.8669,1.027802,0.678363,0.4094
40,0.5854,1.012543,0.707602,0.527515
50,0.449,1.027242,0.701754,0.497865
60,0.294,0.986448,0.74269,0.609284
70,0.2019,1.156547,0.71345,0.5462
80,0.157,1.249398,0.719298,0.574853
90,0.0962,1.227833,0.725146,0.548201
100,0.0571,1.322394,0.695906,0.561942


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.797,1.456134,0.532164,0.232643
20,1.1702,1.115634,0.649123,0.367058
30,0.8669,1.027802,0.678363,0.4094
40,0.5854,1.012543,0.707602,0.527515
50,0.449,1.027242,0.701754,0.497865
60,0.294,0.986448,0.74269,0.609284
70,0.2019,1.156547,0.71345,0.5462
80,0.157,1.249398,0.719298,0.574853
90,0.0962,1.227833,0.725146,0.548201
100,0.0571,1.322394,0.695906,0.561942


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.797,1.456134,0.532164,0.232643
20,1.1702,1.115634,0.649123,0.367058
30,0.8669,1.027802,0.678363,0.4094
40,0.5854,1.012543,0.707602,0.527515
50,0.449,1.027242,0.701754,0.497865
60,0.294,0.986448,0.74269,0.609284
70,0.2019,1.156547,0.71345,0.5462
80,0.157,1.249398,0.719298,0.574853
90,0.0962,1.227833,0.725146,0.548201
100,0.0571,1.322394,0.695906,0.561942


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.843,1.444382,0.561404,0.17992
20,1.234,1.106577,0.660819,0.297915
30,0.7824,1.079086,0.666667,0.321344
40,0.5729,1.13341,0.695906,0.46951
50,0.419,1.068544,0.701754,0.440886
60,0.2528,1.113602,0.695906,0.505927
70,0.2218,1.358237,0.678363,0.515861
80,0.1306,1.174455,0.71345,0.49174
90,0.0998,1.365094,0.707602,0.433919
100,0.1353,1.34332,0.690058,0.502609


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.843,1.444382,0.561404,0.17992
20,1.234,1.106577,0.660819,0.297915
30,0.7824,1.079086,0.666667,0.321344
40,0.5729,1.13341,0.695906,0.46951
50,0.419,1.068544,0.701754,0.440886
60,0.2528,1.113602,0.695906,0.505927
70,0.2218,1.358237,0.678363,0.515861
80,0.1306,1.174455,0.71345,0.49174
90,0.0998,1.365094,0.707602,0.433919
100,0.1353,1.34332,0.690058,0.502609


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.843,1.444382,0.561404,0.17992
20,1.234,1.106577,0.660819,0.297915
30,0.7824,1.079086,0.666667,0.321344
40,0.5729,1.13341,0.695906,0.46951
50,0.419,1.068544,0.701754,0.440886
60,0.2528,1.113602,0.695906,0.505927
70,0.2218,1.358237,0.678363,0.515861
80,0.1306,1.174455,0.71345,0.49174
90,0.0998,1.365094,0.707602,0.433919
100,0.1353,1.34332,0.690058,0.502609


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8184,1.48268,0.538012,0.222719
20,1.1884,1.095231,0.643275,0.360395
30,0.8745,0.979592,0.684211,0.411921
40,0.6666,0.907999,0.725146,0.466387
50,0.4344,0.922148,0.730994,0.54068
60,0.3239,0.983034,0.754386,0.597642
70,0.2425,1.02089,0.690058,0.523589
80,0.1786,1.003332,0.736842,0.612866
90,0.108,1.105792,0.74269,0.619761
100,0.0954,1.050525,0.748538,0.559111


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8184,1.48268,0.538012,0.222719
20,1.1884,1.095231,0.643275,0.360395
30,0.8745,0.979592,0.684211,0.411921
40,0.6666,0.907999,0.725146,0.466387
50,0.4344,0.922148,0.730994,0.54068
60,0.3239,0.983034,0.754386,0.597642
70,0.2425,1.02089,0.690058,0.523589
80,0.1786,1.003332,0.736842,0.612866
90,0.108,1.105792,0.74269,0.619761
100,0.0954,1.050525,0.748538,0.559111


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8184,1.48268,0.538012,0.222719
20,1.1884,1.095231,0.643275,0.360395
30,0.8745,0.979592,0.684211,0.411921
40,0.6666,0.907999,0.725146,0.466387
50,0.4344,0.922148,0.730994,0.54068
60,0.3239,0.983034,0.754386,0.597642
70,0.2425,1.02089,0.690058,0.523589
80,0.1786,1.003332,0.736842,0.612866
90,0.108,1.105792,0.74269,0.619761
100,0.0954,1.050525,0.748538,0.559111


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

tunis-ai/TunBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.01,1.942543,0.315789,0.053333
20,1.906,1.994689,0.339181,0.100965
30,1.9037,1.90627,0.315789,0.053333
40,1.8792,1.911094,0.362573,0.10587
50,1.7551,1.843125,0.391813,0.118242
60,1.7368,1.831976,0.380117,0.143042
70,1.5282,1.840458,0.380117,0.130693
80,1.6196,1.876808,0.391813,0.138046
90,1.5971,1.879591,0.385965,0.147849
100,1.4812,1.859062,0.403509,0.141549


tunis-ai/TunBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.01,1.942543,0.315789,0.053333
20,1.906,1.994689,0.339181,0.100965
30,1.9037,1.90627,0.315789,0.053333
40,1.8792,1.911094,0.362573,0.10587
50,1.7551,1.843125,0.391813,0.118242
60,1.7368,1.831976,0.380117,0.143042
70,1.5282,1.840458,0.380117,0.130693
80,1.6196,1.876808,0.391813,0.138046
90,1.5971,1.879591,0.385965,0.147849
100,1.4812,1.859062,0.403509,0.141549


tunis-ai/TunBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.01,1.942543,0.315789,0.053333
20,1.906,1.994689,0.339181,0.100965
30,1.9037,1.90627,0.315789,0.053333
40,1.8792,1.911094,0.362573,0.10587
50,1.7551,1.843125,0.391813,0.118242
60,1.7368,1.831976,0.380117,0.143042
70,1.5282,1.840458,0.380117,0.130693
80,1.6196,1.876808,0.391813,0.138046
90,1.5971,1.879591,0.385965,0.147849
100,1.4812,1.859062,0.403509,0.141549


tunis-ai/TunBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0036,1.940887,0.175439,0.029131
20,1.9924,1.910545,0.397661,0.051731
30,1.9052,1.845663,0.397661,0.051731
40,1.9064,1.795005,0.461988,0.106383
50,1.7707,2.05493,0.239766,0.054308
60,1.8177,1.71102,0.467836,0.106768
70,1.6438,1.717408,0.461988,0.112958
80,1.6778,1.656147,0.467836,0.143658
90,1.5492,1.748919,0.421053,0.142462
100,1.5187,1.636704,0.491228,0.158074


tunis-ai/TunBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0036,1.940887,0.175439,0.029131
20,1.9924,1.910545,0.397661,0.051731
30,1.9052,1.845663,0.397661,0.051731
40,1.9064,1.795005,0.461988,0.106383
50,1.7707,2.05493,0.239766,0.054308
60,1.8177,1.71102,0.467836,0.106768
70,1.6438,1.717408,0.461988,0.112958
80,1.6778,1.656147,0.467836,0.143658
90,1.5492,1.748919,0.421053,0.142462
100,1.5187,1.636704,0.491228,0.158074


tunis-ai/TunBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.0036,1.940887,0.175439,0.029131
20,1.9924,1.910545,0.397661,0.051731
30,1.9052,1.845663,0.397661,0.051731
40,1.9064,1.795005,0.461988,0.106383
50,1.7707,2.05493,0.239766,0.054308
60,1.8177,1.71102,0.467836,0.106768
70,1.6438,1.717408,0.461988,0.112958
80,1.6778,1.656147,0.467836,0.143658
90,1.5492,1.748919,0.421053,0.142462
100,1.5187,1.636704,0.491228,0.158074


tunis-ai/TunBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.039,1.989886,0.321637,0.054081
20,1.9082,1.949076,0.181287,0.034103
30,1.9873,1.916587,0.321637,0.054081
40,1.9549,1.890534,0.321637,0.054081
50,1.8298,1.909469,0.339181,0.096947
60,1.8153,1.874115,0.327485,0.096948
70,1.7353,1.831937,0.350877,0.103376
80,1.786,1.776119,0.356725,0.105391
90,1.6321,1.756086,0.385965,0.113686
100,1.5189,1.746596,0.421053,0.140506


tunis-ai/TunBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.039,1.989886,0.321637,0.054081
20,1.9082,1.949076,0.181287,0.034103
30,1.9873,1.916587,0.321637,0.054081
40,1.9549,1.890534,0.321637,0.054081
50,1.8298,1.909469,0.339181,0.096947
60,1.8153,1.874115,0.327485,0.096948
70,1.7353,1.831937,0.350877,0.103376
80,1.786,1.776119,0.356725,0.105391
90,1.6321,1.756086,0.385965,0.113686
100,1.5189,1.746596,0.421053,0.140506


tunis-ai/TunBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,2.039,1.989886,0.321637,0.054081
20,1.9082,1.949076,0.181287,0.034103
30,1.9873,1.916587,0.321637,0.054081
40,1.9549,1.890534,0.321637,0.054081
50,1.8298,1.909469,0.339181,0.096947
60,1.8153,1.874115,0.327485,0.096948
70,1.7353,1.831937,0.350877,0.103376
80,1.786,1.776119,0.356725,0.105391
90,1.6321,1.756086,0.385965,0.113686
100,1.5189,1.746596,0.421053,0.140506


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

alger-ia/dziribert, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9673,1.727422,0.409357,0.147056
20,1.3938,1.277377,0.619883,0.308668
30,0.9738,1.038326,0.666667,0.428257
40,0.6437,0.927825,0.672515,0.402663
50,0.3918,0.914712,0.71345,0.47763
60,0.2065,0.948899,0.725146,0.482537
70,0.1113,1.059221,0.719298,0.554994
80,0.0676,1.071494,0.701754,0.512804
90,0.0341,1.121985,0.719298,0.483551
100,0.0186,1.129223,0.719298,0.502758


alger-ia/dziribert, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9673,1.727422,0.409357,0.147056
20,1.3938,1.277377,0.619883,0.308668
30,0.9738,1.038326,0.666667,0.428257
40,0.6437,0.927825,0.672515,0.402663
50,0.3918,0.914712,0.71345,0.47763
60,0.2065,0.948899,0.725146,0.482537
70,0.1113,1.059221,0.719298,0.554994
80,0.0676,1.071494,0.701754,0.512804
90,0.0341,1.121985,0.719298,0.483551
100,0.0186,1.129223,0.719298,0.502758


alger-ia/dziribert, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9673,1.727422,0.409357,0.147056
20,1.3938,1.277377,0.619883,0.308668
30,0.9738,1.038326,0.666667,0.428257
40,0.6437,0.927825,0.672515,0.402663
50,0.3918,0.914712,0.71345,0.47763
60,0.2065,0.948899,0.725146,0.482537
70,0.1113,1.059221,0.719298,0.554994
80,0.0676,1.071494,0.701754,0.512804
90,0.0341,1.121985,0.719298,0.483551
100,0.0186,1.129223,0.719298,0.502758


alger-ia/dziribert, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9826,1.691244,0.479532,0.157566
20,1.4951,1.323888,0.584795,0.201089
30,0.9899,1.10203,0.637427,0.254917
40,0.7295,1.078532,0.654971,0.334017
50,0.4117,0.998032,0.660819,0.315112
60,0.2715,1.013209,0.690058,0.375387
70,0.1911,0.972562,0.730994,0.490047
80,0.0809,1.01922,0.672515,0.427218
90,0.0455,1.064055,0.725146,0.53123
100,0.032,1.209596,0.649123,0.395575


alger-ia/dziribert, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9826,1.691244,0.479532,0.157566
20,1.4951,1.323888,0.584795,0.201089
30,0.9899,1.10203,0.637427,0.254917
40,0.7295,1.078532,0.654971,0.334017
50,0.4117,0.998032,0.660819,0.315112
60,0.2715,1.013209,0.690058,0.375387
70,0.1911,0.972562,0.730994,0.490047
80,0.0809,1.01922,0.672515,0.427218
90,0.0455,1.064055,0.725146,0.53123
100,0.032,1.209596,0.649123,0.395575


alger-ia/dziribert, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9826,1.691244,0.479532,0.157566
20,1.4951,1.323888,0.584795,0.201089
30,0.9899,1.10203,0.637427,0.254917
40,0.7295,1.078532,0.654971,0.334017
50,0.4117,0.998032,0.660819,0.315112
60,0.2715,1.013209,0.690058,0.375387
70,0.1911,0.972562,0.730994,0.490047
80,0.0809,1.01922,0.672515,0.427218
90,0.0455,1.064055,0.725146,0.53123
100,0.032,1.209596,0.649123,0.395575


alger-ia/dziribert, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9544,1.681055,0.438596,0.16842
20,1.3881,1.288269,0.567251,0.268914
30,1.005,1.055454,0.625731,0.350185
40,0.7046,1.002396,0.672515,0.400247
50,0.4333,0.967133,0.695906,0.463737
60,0.2648,0.98018,0.678363,0.466419
70,0.1513,1.079972,0.684211,0.466835
80,0.0917,1.039557,0.730994,0.570141
90,0.0395,1.169161,0.71345,0.563895
100,0.0235,1.230832,0.71345,0.508117


alger-ia/dziribert, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9544,1.681055,0.438596,0.16842
20,1.3881,1.288269,0.567251,0.268914
30,1.005,1.055454,0.625731,0.350185
40,0.7046,1.002396,0.672515,0.400247
50,0.4333,0.967133,0.695906,0.463737
60,0.2648,0.98018,0.678363,0.466419
70,0.1513,1.079972,0.684211,0.466835
80,0.0917,1.039557,0.730994,0.570141
90,0.0395,1.169161,0.71345,0.563895
100,0.0235,1.230832,0.71345,0.508117


alger-ia/dziribert, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9544,1.681055,0.438596,0.16842
20,1.3881,1.288269,0.567251,0.268914
30,1.005,1.055454,0.625731,0.350185
40,0.7046,1.002396,0.672515,0.400247
50,0.4333,0.967133,0.695906,0.463737
60,0.2648,0.98018,0.678363,0.466419
70,0.1513,1.079972,0.684211,0.466835
80,0.0917,1.039557,0.730994,0.570141
90,0.0395,1.169161,0.71345,0.563895
100,0.0235,1.230832,0.71345,0.508117


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

SI2M-Lab/DarijaBERT, try:0


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9048,1.671892,0.385965,0.132576
20,1.3658,1.344011,0.573099,0.267395
30,1.032,1.094569,0.643275,0.346088
40,0.7258,0.974752,0.71345,0.448748
50,0.5013,0.969496,0.707602,0.489264
60,0.3487,1.006144,0.725146,0.503916
70,0.214,1.039534,0.754386,0.57293
80,0.1876,1.15206,0.695906,0.499464
90,0.1223,1.094475,0.730994,0.577485
100,0.0644,1.251686,0.719298,0.502422


SI2M-Lab/DarijaBERT, try:1


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9048,1.671892,0.385965,0.132576
20,1.3658,1.344011,0.573099,0.267395
30,1.032,1.094569,0.643275,0.346088
40,0.7258,0.974752,0.71345,0.448748
50,0.5013,0.969496,0.707602,0.489264
60,0.3487,1.006144,0.725146,0.503916
70,0.214,1.039534,0.754386,0.57293
80,0.1876,1.15206,0.695906,0.499464
90,0.1223,1.094475,0.730994,0.577485
100,0.0644,1.251686,0.719298,0.502422


SI2M-Lab/DarijaBERT, try:2


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9048,1.671892,0.385965,0.132576
20,1.3658,1.344011,0.573099,0.267395
30,1.032,1.094569,0.643275,0.346088
40,0.7258,0.974752,0.71345,0.448748
50,0.5013,0.969496,0.707602,0.489264
60,0.3487,1.006144,0.725146,0.503916
70,0.214,1.039534,0.754386,0.57293
80,0.1876,1.15206,0.695906,0.499464
90,0.1223,1.094475,0.730994,0.577485
100,0.0644,1.251686,0.719298,0.502422


SI2M-Lab/DarijaBERT, try:0


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9412,1.673671,0.491228,0.144843
20,1.4691,1.4585,0.555556,0.223787
30,0.9911,1.250955,0.619883,0.274118
40,0.7812,1.171206,0.643275,0.31891
50,0.481,1.307557,0.578947,0.280987
60,0.3757,1.365985,0.649123,0.33889
70,0.2987,1.260936,0.666667,0.39566
80,0.1685,1.290772,0.649123,0.385515
90,0.115,1.311715,0.684211,0.441368
100,0.086,1.452834,0.649123,0.339144


SI2M-Lab/DarijaBERT, try:1


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9412,1.673671,0.491228,0.144843
20,1.4691,1.4585,0.555556,0.223787
30,0.9911,1.250955,0.619883,0.274118
40,0.7812,1.171206,0.643275,0.31891
50,0.481,1.307557,0.578947,0.280987
60,0.3757,1.365985,0.649123,0.33889
70,0.2987,1.260936,0.666667,0.39566
80,0.1685,1.290772,0.649123,0.385515
90,0.115,1.311715,0.684211,0.441368
100,0.086,1.452834,0.649123,0.339144


SI2M-Lab/DarijaBERT, try:2


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9412,1.673671,0.491228,0.144843
20,1.4691,1.4585,0.555556,0.223787
30,0.9911,1.250955,0.619883,0.274118
40,0.7812,1.171206,0.643275,0.31891
50,0.481,1.307557,0.578947,0.280987
60,0.3757,1.365985,0.649123,0.33889
70,0.2987,1.260936,0.666667,0.39566
80,0.1685,1.290772,0.649123,0.385515
90,0.115,1.311715,0.684211,0.441368
100,0.086,1.452834,0.649123,0.339144


SI2M-Lab/DarijaBERT, try:0


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9341,1.750564,0.374269,0.123551
20,1.4954,1.373624,0.584795,0.29107
30,1.1225,1.136954,0.660819,0.407164
40,0.8249,1.075731,0.654971,0.442195
50,0.5468,1.055672,0.672515,0.428174
60,0.3699,1.060412,0.725146,0.565986
70,0.254,1.107995,0.684211,0.508286
80,0.2141,1.16186,0.695906,0.522565
90,0.1268,1.208541,0.695906,0.499255
100,0.0967,1.144718,0.707602,0.533485


SI2M-Lab/DarijaBERT, try:1


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9341,1.750564,0.374269,0.123551
20,1.4954,1.373624,0.584795,0.29107
30,1.1225,1.136954,0.660819,0.407164
40,0.8249,1.075731,0.654971,0.442195
50,0.5468,1.055672,0.672515,0.428174
60,0.3699,1.060412,0.725146,0.565986
70,0.254,1.107995,0.684211,0.508286
80,0.2141,1.16186,0.695906,0.522565
90,0.1268,1.208541,0.695906,0.499255
100,0.0967,1.144718,0.707602,0.533485


SI2M-Lab/DarijaBERT, try:2


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9341,1.750564,0.374269,0.123551
20,1.4954,1.373624,0.584795,0.29107
30,1.1225,1.136954,0.660819,0.407164
40,0.8249,1.075731,0.654971,0.442195
50,0.5468,1.055672,0.672515,0.428174
60,0.3699,1.060412,0.725146,0.565986
70,0.254,1.107995,0.684211,0.508286
80,0.2141,1.16186,0.695906,0.522565
90,0.1268,1.208541,0.695906,0.499255
100,0.0967,1.144718,0.707602,0.533485


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

otmangi/MorRoBERTa, try:0


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9258,1.75022,0.426901,0.1834
20,1.4778,1.425571,0.549708,0.270164
30,1.1123,1.247542,0.608187,0.361305
40,0.8311,1.104753,0.631579,0.398379
50,0.5583,1.10798,0.643275,0.426358
60,0.3809,1.116383,0.649123,0.441899
70,0.2663,1.243193,0.649123,0.449181
80,0.1892,1.262129,0.625731,0.417048
90,0.1144,1.295828,0.660819,0.491646
100,0.0652,1.418666,0.637427,0.440647


otmangi/MorRoBERTa, try:1


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9258,1.75022,0.426901,0.1834
20,1.4778,1.425571,0.549708,0.270164
30,1.1123,1.247542,0.608187,0.361305
40,0.8311,1.104753,0.631579,0.398379
50,0.5583,1.10798,0.643275,0.426358
60,0.3809,1.116383,0.649123,0.441899
70,0.2663,1.243193,0.649123,0.449181
80,0.1892,1.262129,0.625731,0.417048
90,0.1144,1.295828,0.660819,0.491646
100,0.0652,1.418666,0.637427,0.440647


otmangi/MorRoBERTa, try:2


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9258,1.75022,0.426901,0.1834
20,1.4778,1.425571,0.549708,0.270164
30,1.1123,1.247542,0.608187,0.361305
40,0.8311,1.104753,0.631579,0.398379
50,0.5583,1.10798,0.643275,0.426358
60,0.3809,1.116383,0.649123,0.441899
70,0.2663,1.243193,0.649123,0.449181
80,0.1892,1.262129,0.625731,0.417048
90,0.1144,1.295828,0.660819,0.491646
100,0.0652,1.418666,0.637427,0.440647


otmangi/MorRoBERTa, try:0


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9607,1.708425,0.426901,0.146707
20,1.5091,1.396394,0.584795,0.238747
30,1.0869,1.248222,0.596491,0.247428
40,0.8515,1.241084,0.614035,0.299943
50,0.527,1.238433,0.625731,0.315012
60,0.3769,1.197382,0.678363,0.37803
70,0.2834,1.393095,0.649123,0.357373
80,0.1706,1.283134,0.672515,0.398453
90,0.108,1.422924,0.654971,0.389442
100,0.0845,1.4282,0.654971,0.373165


otmangi/MorRoBERTa, try:1


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9607,1.708425,0.426901,0.146707
20,1.5091,1.396394,0.584795,0.238747
30,1.0869,1.248222,0.596491,0.247428
40,0.8515,1.241084,0.614035,0.299943
50,0.527,1.238433,0.625731,0.315012
60,0.3769,1.197382,0.678363,0.37803
70,0.2834,1.393095,0.649123,0.357373
80,0.1706,1.283134,0.672515,0.398453
90,0.108,1.422924,0.654971,0.389442
100,0.0845,1.4282,0.654971,0.373165


otmangi/MorRoBERTa, try:2


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9607,1.708425,0.426901,0.146707
20,1.5091,1.396394,0.584795,0.238747
30,1.0869,1.248222,0.596491,0.247428
40,0.8515,1.241084,0.614035,0.299943
50,0.527,1.238433,0.625731,0.315012
60,0.3769,1.197382,0.678363,0.37803
70,0.2834,1.393095,0.649123,0.357373
80,0.1706,1.283134,0.672515,0.398453
90,0.108,1.422924,0.654971,0.389442
100,0.0845,1.4282,0.654971,0.373165


otmangi/MorRoBERTa, try:0


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9334,1.669819,0.438596,0.164791
20,1.458,1.393062,0.508772,0.244949
30,1.14,1.164517,0.619883,0.340355
40,0.8512,1.094415,0.649123,0.388572
50,0.6071,1.012347,0.678363,0.448373
60,0.4136,1.024966,0.695906,0.506056
70,0.275,1.009048,0.71345,0.576027
80,0.1993,1.053709,0.690058,0.520571
90,0.1126,1.133862,0.701754,0.55773
100,0.0713,1.217952,0.678363,0.539689


otmangi/MorRoBERTa, try:1


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9334,1.669819,0.438596,0.164791
20,1.458,1.393062,0.508772,0.244949
30,1.14,1.164517,0.619883,0.340355
40,0.8512,1.094415,0.649123,0.388572
50,0.6071,1.012347,0.678363,0.448373
60,0.4136,1.024966,0.695906,0.506056
70,0.275,1.009048,0.71345,0.576027
80,0.1993,1.053709,0.690058,0.520571
90,0.1126,1.133862,0.701754,0.55773
100,0.0713,1.217952,0.678363,0.539689


otmangi/MorRoBERTa, try:2


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.9334,1.669819,0.438596,0.164791
20,1.458,1.393062,0.508772,0.244949
30,1.14,1.164517,0.619883,0.340355
40,0.8512,1.094415,0.649123,0.388572
50,0.6071,1.012347,0.678363,0.448373
60,0.4136,1.024966,0.695906,0.506056
70,0.275,1.009048,0.71345,0.576027
80,0.1993,1.053709,0.690058,0.520571
90,0.1126,1.133862,0.701754,0.55773
100,0.0713,1.217952,0.678363,0.539689


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

otmangi/MorrBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8327,1.49751,0.573099,0.288035
20,1.1882,1.178828,0.608187,0.317424
30,0.8804,1.049534,0.672515,0.394176
40,0.6012,0.946682,0.71345,0.520331
50,0.3951,0.996129,0.701754,0.563791
60,0.2075,0.979982,0.719298,0.588092
70,0.1826,1.085568,0.719298,0.504411
80,0.1378,1.023577,0.730994,0.611751
90,0.0903,1.229767,0.695906,0.524919
100,0.0708,1.253977,0.695906,0.562675


otmangi/MorrBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8327,1.49751,0.573099,0.288035
20,1.1882,1.178828,0.608187,0.317424
30,0.8804,1.049534,0.672515,0.394176
40,0.6012,0.946682,0.71345,0.520331
50,0.3951,0.996129,0.701754,0.563791
60,0.2075,0.979982,0.719298,0.588092
70,0.1826,1.085568,0.719298,0.504411
80,0.1378,1.023577,0.730994,0.611751
90,0.0903,1.229767,0.695906,0.524919
100,0.0708,1.253977,0.695906,0.562675


otmangi/MorrBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8327,1.49751,0.573099,0.288035
20,1.1882,1.178828,0.608187,0.317424
30,0.8804,1.049534,0.672515,0.394176
40,0.6012,0.946682,0.71345,0.520331
50,0.3951,0.996129,0.701754,0.563791
60,0.2075,0.979982,0.719298,0.588092
70,0.1826,1.085568,0.719298,0.504411
80,0.1378,1.023577,0.730994,0.611751
90,0.0903,1.229767,0.695906,0.524919
100,0.0708,1.253977,0.695906,0.562675


otmangi/MorrBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.888,1.520045,0.538012,0.213114
20,1.2546,1.212645,0.637427,0.266647
30,0.8351,1.061955,0.678363,0.299934
40,0.6364,1.036336,0.701754,0.416537
50,0.3518,0.999189,0.725146,0.481741
60,0.2262,1.070827,0.707602,0.446974
70,0.185,1.097269,0.719298,0.450566
80,0.0965,1.231263,0.678363,0.435338
90,0.0754,1.155699,0.701754,0.447234
100,0.0651,1.215822,0.684211,0.442872


otmangi/MorrBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.888,1.520045,0.538012,0.213114
20,1.2546,1.212645,0.637427,0.266647
30,0.8351,1.061955,0.678363,0.299934
40,0.6364,1.036336,0.701754,0.416537
50,0.3518,0.999189,0.725146,0.481741
60,0.2262,1.070827,0.707602,0.446974
70,0.185,1.097269,0.719298,0.450566
80,0.0965,1.231263,0.678363,0.435338
90,0.0754,1.155699,0.701754,0.447234
100,0.0651,1.215822,0.684211,0.442872


otmangi/MorrBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.888,1.520045,0.538012,0.213114
20,1.2546,1.212645,0.637427,0.266647
30,0.8351,1.061955,0.678363,0.299934
40,0.6364,1.036336,0.701754,0.416537
50,0.3518,0.999189,0.725146,0.481741
60,0.2262,1.070827,0.707602,0.446974
70,0.185,1.097269,0.719298,0.450566
80,0.0965,1.231263,0.678363,0.435338
90,0.0754,1.155699,0.701754,0.447234
100,0.0651,1.215822,0.684211,0.442872


otmangi/MorrBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8445,1.538296,0.520468,0.256481
20,1.2264,1.139264,0.631579,0.33939
30,0.8915,0.980184,0.678363,0.428125
40,0.6233,0.866787,0.719298,0.503114
50,0.3856,0.895401,0.707602,0.515022
60,0.2195,0.965935,0.678363,0.4737
70,0.1454,1.079721,0.695906,0.566565
80,0.0996,1.059929,0.707602,0.55729
90,0.0622,1.165489,0.701754,0.549524
100,0.0418,1.109924,0.707602,0.587428


otmangi/MorrBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8445,1.538296,0.520468,0.256481
20,1.2264,1.139264,0.631579,0.33939
30,0.8915,0.980184,0.678363,0.428125
40,0.6233,0.866787,0.719298,0.503114
50,0.3856,0.895401,0.707602,0.515022
60,0.2195,0.965935,0.678363,0.4737
70,0.1454,1.079721,0.695906,0.566565
80,0.0996,1.059929,0.707602,0.55729
90,0.0622,1.165489,0.701754,0.549524
100,0.0418,1.109924,0.707602,0.587428


otmangi/MorrBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,1.8445,1.538296,0.520468,0.256481
20,1.2264,1.139264,0.631579,0.33939
30,0.8915,0.980184,0.678363,0.428125
40,0.6233,0.866787,0.719298,0.503114
50,0.3856,0.895401,0.707602,0.515022
60,0.2195,0.965935,0.678363,0.4737
70,0.1454,1.079721,0.695906,0.566565
80,0.0996,1.059929,0.707602,0.55729
90,0.0622,1.165489,0.701754,0.549524
100,0.0418,1.109924,0.707602,0.587428


Unnamed: 0,Model,Accuracy,F1
0,SI2M-Lab/DarijaBERT,0.77193,0.622234
3,alger-ia/dziribert,0.730994,0.606202
6,faisalq/EgyBERT,0.666667,0.459321
8,faisalq/SaudiBERT,0.74269,0.619761
11,otmangi/MorRoBERTa,0.719298,0.614669
14,otmangi/MorrBERT,0.730994,0.611751
17,tunis-ai/TunBERT,0.51462,0.304322
