In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'dreviews_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


dataset = load_dataset('ohidaoui/darija-reviews')


df = pd.DataFrame(dataset['test'])

display(len(df))
      
display(df.columns)
display(df[:4])

df['label'] = df['label'].replace('negative ', 'negative')

c = df['label'].value_counts()
display(c)

classes = set(df['label'].values)
display(classes)

df['label'] = df['label'].astype('category')
df['label'] = df['label'].cat.codes

df = df[['review', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))



max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]

seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['review'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 30
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 10, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 10
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-18 20:30:57.113987: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-18 20:30:57.137175: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.
Found cached dataset parquet (/home/ffq/.cache/huggingface/datasets/ohidaoui___parquet/ohidaoui--darija-reviews-34030453886e5230/0.0.0/14a00e99c0d15a23649d0db8944380ac81082d4b021f398733dd84f3a6c569a7)


  0%|          | 0/1 [00:00<?, ?it/s]

851

Index(['review', 'label', 'topic', 'writing_style'], dtype='object')

Unnamed: 0,review,label,topic,writing_style
0,داسيا فقدت أهم ميزة كانت تميزها وهي السعر للأسف !,negative,automotive,Arabic
1,لاأظنها ستنجح كالنسخ الأولى,negative,automotive,Arabic
2,Khas ykon tghyir mbanch li lfar9 rir fa dizayn lkrasa mikanik tablo fih dak lblstik lmryat 3lach mdyrinch lhm daw volm mzl kif mahwa jwant kifma howa fin kyn lfr9 fdizyn ama ljiti tchof mkynch fra9 fra9 howa y9riban 40% mli kt9ol l3mrya hdi bnsba li ana nas 3morya ama l3morya kolchi daw mzl khsha whd 10 ans wnchofo ana knfdl dacia l9dima,negative,automotive,Arabizi
3,هناك اختيارات أحسن وماركات عالميه أجود من داصيا.,negative,automotive,Arabic


label
positive    456
negative    273
neutral     122
Name: count, dtype: int64

{'negative', 'neutral', 'positive'}

3

851

DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9871,0.820749,0.625731,0.453039
20,0.8123,0.67399,0.71345,0.490113
30,0.6296,0.620058,0.730994,0.641682
40,0.447,0.533679,0.783626,0.635057
50,0.3193,0.576427,0.795322,0.708191
60,0.2351,0.522439,0.818713,0.731054
70,0.1505,0.600028,0.812865,0.722175
80,0.0987,0.727973,0.783626,0.701103
90,0.0728,0.820526,0.783626,0.715047
100,0.0597,0.922145,0.795322,0.725894


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9563,0.801001,0.602339,0.43792
20,0.766,0.652882,0.730994,0.535526
30,0.595,0.62929,0.74269,0.643796
40,0.4259,0.523222,0.795322,0.674987
50,0.3246,0.581451,0.80117,0.717013
60,0.2128,0.583591,0.807018,0.748375
70,0.167,0.60588,0.836257,0.774579
80,0.0801,0.65301,0.830409,0.768217
90,0.097,0.787016,0.812865,0.746505
100,0.088,0.725889,0.853801,0.802222


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9563,0.801001,0.602339,0.43792
20,0.766,0.652882,0.730994,0.535526
30,0.595,0.62929,0.74269,0.643796
40,0.4259,0.523222,0.795322,0.674987
50,0.3246,0.581451,0.80117,0.717013
60,0.2128,0.583591,0.807018,0.748375
70,0.167,0.60588,0.836257,0.774579
80,0.0801,0.65301,0.830409,0.768217
90,0.097,0.787016,0.812865,0.746505
100,0.088,0.725889,0.853801,0.802222


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9446,0.788926,0.614035,0.4405
20,0.6916,0.683694,0.684211,0.527187
30,0.5043,0.666182,0.666667,0.572538
40,0.3373,0.68318,0.707602,0.589959
50,0.2138,0.808201,0.690058,0.610523
60,0.1559,0.935101,0.725146,0.615581
70,0.0918,1.049271,0.707602,0.63761
80,0.0499,1.097225,0.719298,0.63829
90,0.0552,1.211329,0.725146,0.65907
100,0.0563,1.225253,0.725146,0.612433


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9446,0.788926,0.614035,0.4405
20,0.6916,0.683694,0.684211,0.527187
30,0.5043,0.666182,0.666667,0.572538
40,0.3373,0.68318,0.707602,0.589959
50,0.2138,0.808201,0.690058,0.610523
60,0.1559,0.935101,0.725146,0.615581
70,0.0918,1.049271,0.707602,0.63761
80,0.0499,1.097225,0.719298,0.63829
90,0.0552,1.211329,0.725146,0.65907
100,0.0563,1.225253,0.725146,0.612433


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9446,0.788926,0.614035,0.4405
20,0.6916,0.683694,0.684211,0.527187
30,0.5043,0.666182,0.666667,0.572538
40,0.3373,0.68318,0.707602,0.589959
50,0.2138,0.808201,0.690058,0.610523
60,0.1559,0.935101,0.725146,0.615581
70,0.0918,1.049271,0.707602,0.63761
80,0.0499,1.097225,0.719298,0.63829
90,0.0552,1.211329,0.725146,0.65907
100,0.0563,1.225253,0.725146,0.612433


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.939,0.875075,0.573099,0.394388
20,0.7501,0.736086,0.678363,0.583512
30,0.5765,0.717518,0.678363,0.597128
40,0.4114,0.63495,0.725146,0.659498
50,0.239,0.720507,0.71345,0.625432
60,0.1613,0.72503,0.766082,0.671435
70,0.1213,0.844387,0.754386,0.660777
80,0.0889,0.873588,0.730994,0.647009
90,0.0485,1.080744,0.736842,0.671111
100,0.0466,0.935691,0.748538,0.659928


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.939,0.875075,0.573099,0.394388
20,0.7501,0.736086,0.678363,0.583512
30,0.5765,0.717518,0.678363,0.597128
40,0.4114,0.63495,0.725146,0.659498
50,0.239,0.720507,0.71345,0.625432
60,0.1613,0.72503,0.766082,0.671435
70,0.1213,0.844387,0.754386,0.660777
80,0.0889,0.873588,0.730994,0.647009
90,0.0485,1.080744,0.736842,0.671111
100,0.0466,0.935691,0.748538,0.659928


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.939,0.875075,0.573099,0.394388
20,0.7501,0.736086,0.678363,0.583512
30,0.5765,0.717518,0.678363,0.597128
40,0.4114,0.63495,0.725146,0.659498
50,0.239,0.720507,0.71345,0.625432
60,0.1613,0.72503,0.766082,0.671435
70,0.1213,0.844387,0.754386,0.660777
80,0.0889,0.873588,0.730994,0.647009
90,0.0485,1.080744,0.736842,0.671111
100,0.0466,0.935691,0.748538,0.659928


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.978,0.853487,0.619883,0.367588
20,0.8067,0.718566,0.707602,0.488209
30,0.6663,0.68861,0.730994,0.526932
40,0.4834,0.619703,0.725146,0.616145
50,0.382,0.660248,0.736842,0.609575
60,0.2967,0.660686,0.766082,0.665586
70,0.2369,0.844372,0.707602,0.619321
80,0.2212,0.751362,0.760234,0.673394
90,0.2092,0.932927,0.707602,0.634398
100,0.1991,0.922401,0.748538,0.654361


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.978,0.853487,0.619883,0.367588
20,0.8067,0.718566,0.707602,0.488209
30,0.6663,0.68861,0.730994,0.526932
40,0.4834,0.619703,0.725146,0.616145
50,0.382,0.660248,0.736842,0.609575
60,0.2967,0.660686,0.766082,0.665586
70,0.2369,0.844372,0.707602,0.619321
80,0.2212,0.751362,0.760234,0.673394
90,0.2092,0.932927,0.707602,0.634398
100,0.1991,0.922401,0.748538,0.654361


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.978,0.853487,0.619883,0.367588
20,0.8067,0.718566,0.707602,0.488209
30,0.6663,0.68861,0.730994,0.526932
40,0.4834,0.619703,0.725146,0.616145
50,0.382,0.660248,0.736842,0.609575
60,0.2967,0.660686,0.766082,0.665586
70,0.2369,0.844372,0.707602,0.619321
80,0.2212,0.751362,0.760234,0.673394
90,0.2092,0.932927,0.707602,0.634398
100,0.1991,0.922401,0.748538,0.654361


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9745,0.803076,0.643275,0.43655
20,0.7591,0.738965,0.678363,0.458384
30,0.5741,0.694076,0.690058,0.544827
40,0.3943,0.764537,0.695906,0.561908
50,0.2638,0.846594,0.707602,0.612534
60,0.2046,0.816663,0.754386,0.610834
70,0.1456,1.059105,0.672515,0.590098
80,0.1439,1.058751,0.701754,0.54885
90,0.1051,1.255055,0.684211,0.573282
100,0.0794,1.041168,0.701754,0.60144


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9745,0.803076,0.643275,0.43655
20,0.7591,0.738965,0.678363,0.458384
30,0.5741,0.694076,0.690058,0.544827
40,0.3943,0.764537,0.695906,0.561908
50,0.2638,0.846594,0.707602,0.612534
60,0.2046,0.816663,0.754386,0.610834
70,0.1456,1.059105,0.672515,0.590098
80,0.1439,1.058751,0.701754,0.54885
90,0.1051,1.255055,0.684211,0.573282
100,0.0794,1.041168,0.701754,0.60144


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9745,0.803076,0.643275,0.43655
20,0.7591,0.738965,0.678363,0.458384
30,0.5741,0.694076,0.690058,0.544827
40,0.3943,0.764537,0.695906,0.561908
50,0.2638,0.846594,0.707602,0.612534
60,0.2046,0.816663,0.754386,0.610834
70,0.1456,1.059105,0.672515,0.590098
80,0.1439,1.058751,0.701754,0.54885
90,0.1051,1.255055,0.684211,0.573282
100,0.0794,1.041168,0.701754,0.60144


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9656,0.910902,0.567251,0.370453
20,0.787,0.784081,0.631579,0.443117
30,0.5761,0.784671,0.660819,0.491634
40,0.4217,0.840523,0.631579,0.503733
50,0.3172,0.920858,0.631579,0.516963
60,0.2863,0.989074,0.654971,0.534642
70,0.2081,0.998514,0.666667,0.554953
80,0.1994,1.075951,0.654971,0.531006
90,0.1446,1.2247,0.678363,0.55316
100,0.1566,1.249161,0.666667,0.567374


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9656,0.910902,0.567251,0.370453
20,0.787,0.784081,0.631579,0.443117
30,0.5761,0.784671,0.660819,0.491634
40,0.4217,0.840523,0.631579,0.503733
50,0.3172,0.920858,0.631579,0.516963
60,0.2863,0.989074,0.654971,0.534642
70,0.2081,0.998514,0.666667,0.554953
80,0.1994,1.075951,0.654971,0.531006
90,0.1446,1.2247,0.678363,0.55316
100,0.1566,1.249161,0.666667,0.567374


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9656,0.910902,0.567251,0.370453
20,0.787,0.784081,0.631579,0.443117
30,0.5761,0.784671,0.660819,0.491634
40,0.4217,0.840523,0.631579,0.503733
50,0.3172,0.920858,0.631579,0.516963
60,0.2863,0.989074,0.654971,0.534642
70,0.2081,0.998514,0.666667,0.554953
80,0.1994,1.075951,0.654971,0.531006
90,0.1446,1.2247,0.678363,0.55316
100,0.1566,1.249161,0.666667,0.567374


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.964,0.785944,0.649123,0.498932
20,0.7115,0.591308,0.730994,0.560855
30,0.4709,0.586773,0.777778,0.716724
40,0.2788,0.558174,0.80117,0.701616
50,0.1841,0.63728,0.789474,0.740173
60,0.1043,0.838826,0.80117,0.726544
70,0.1104,0.755244,0.795322,0.71952
80,0.0549,0.830344,0.77193,0.699043
90,0.038,1.023799,0.777778,0.700642
100,0.0117,0.913384,0.795322,0.723914


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.964,0.785944,0.649123,0.498932
20,0.7115,0.591308,0.730994,0.560855
30,0.4709,0.586773,0.777778,0.716724
40,0.2788,0.558174,0.80117,0.701616
50,0.1841,0.63728,0.789474,0.740173
60,0.1043,0.838826,0.80117,0.726544
70,0.1104,0.755244,0.795322,0.71952
80,0.0549,0.830344,0.77193,0.699043
90,0.038,1.023799,0.777778,0.700642
100,0.0117,0.913384,0.795322,0.723914


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.964,0.785944,0.649123,0.498932
20,0.7115,0.591308,0.730994,0.560855
30,0.4709,0.586773,0.777778,0.716724
40,0.2788,0.558174,0.80117,0.701616
50,0.1841,0.63728,0.789474,0.740173
60,0.1043,0.838826,0.80117,0.726544
70,0.1104,0.755244,0.795322,0.71952
80,0.0549,0.830344,0.77193,0.699043
90,0.038,1.023799,0.777778,0.700642
100,0.0117,0.913384,0.795322,0.723914


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9486,0.733035,0.660819,0.485172
20,0.6351,0.788702,0.701754,0.509835
30,0.4026,0.794046,0.695906,0.579722
40,0.2555,0.794159,0.754386,0.683812
50,0.1359,0.944468,0.736842,0.676977
60,0.0642,1.07656,0.71345,0.621141
70,0.0739,1.066716,0.748538,0.6838
80,0.0153,1.289506,0.71345,0.653322
90,0.0404,1.403377,0.730994,0.624288
100,0.0557,1.428812,0.719298,0.617906


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9486,0.733035,0.660819,0.485172
20,0.6351,0.788702,0.701754,0.509835
30,0.4026,0.794046,0.695906,0.579722
40,0.2555,0.794159,0.754386,0.683812
50,0.1359,0.944468,0.736842,0.676977
60,0.0642,1.07656,0.71345,0.621141
70,0.0739,1.066716,0.748538,0.6838
80,0.0153,1.289506,0.71345,0.653322
90,0.0404,1.403377,0.730994,0.624288
100,0.0557,1.428812,0.719298,0.617906


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9486,0.733035,0.660819,0.485172
20,0.6351,0.788702,0.701754,0.509835
30,0.4026,0.794046,0.695906,0.579722
40,0.2555,0.794159,0.754386,0.683812
50,0.1359,0.944468,0.736842,0.676977
60,0.0642,1.07656,0.71345,0.621141
70,0.0739,1.066716,0.748538,0.6838
80,0.0153,1.289506,0.71345,0.653322
90,0.0404,1.403377,0.730994,0.624288
100,0.0557,1.428812,0.719298,0.617906


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9347,0.850241,0.584795,0.404722
20,0.6768,0.648804,0.71345,0.605959
30,0.4131,0.675474,0.748538,0.647139
40,0.2496,0.650491,0.80117,0.748254
50,0.1654,1.091172,0.690058,0.578413
60,0.1217,1.100719,0.736842,0.639604
70,0.0929,0.84861,0.783626,0.735421
80,0.0379,0.968208,0.760234,0.713066
90,0.0316,1.374406,0.74269,0.672947
100,0.0232,1.040484,0.77193,0.728178


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9347,0.850241,0.584795,0.404722
20,0.6768,0.648804,0.71345,0.605959
30,0.4131,0.675474,0.748538,0.647139
40,0.2496,0.650491,0.80117,0.748254
50,0.1654,1.091172,0.690058,0.578413
60,0.1217,1.100719,0.736842,0.639604
70,0.0929,0.84861,0.783626,0.735421
80,0.0379,0.968208,0.760234,0.713066
90,0.0316,1.374406,0.74269,0.672947
100,0.0232,1.040484,0.77193,0.728178


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9347,0.850241,0.584795,0.404722
20,0.6768,0.648804,0.71345,0.605959
30,0.4131,0.675474,0.748538,0.647139
40,0.2496,0.650491,0.80117,0.748254
50,0.1654,1.091172,0.690058,0.578413
60,0.1217,1.100719,0.736842,0.639604
70,0.0929,0.84861,0.783626,0.735421
80,0.0379,0.968208,0.760234,0.713066
90,0.0316,1.374406,0.74269,0.672947
100,0.0232,1.040484,0.77193,0.728178


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9824,0.799955,0.631579,0.386706
20,0.7774,0.718888,0.690058,0.46181
30,0.6263,0.646731,0.725146,0.508604
40,0.4659,0.576966,0.777778,0.619937
50,0.3895,0.612372,0.748538,0.589475
60,0.2591,0.754749,0.766082,0.620015
70,0.2716,0.879121,0.754386,0.605239
80,0.1728,0.696254,0.777778,0.684601
90,0.1835,1.177759,0.74269,0.659128
100,0.1621,0.936798,0.77193,0.633566


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9824,0.799955,0.631579,0.386706
20,0.7774,0.718888,0.690058,0.46181
30,0.6263,0.646731,0.725146,0.508604
40,0.4659,0.576966,0.777778,0.619937
50,0.3895,0.612372,0.748538,0.589475
60,0.2591,0.754749,0.766082,0.620015
70,0.2716,0.879121,0.754386,0.605239
80,0.1728,0.696254,0.777778,0.684601
90,0.1835,1.177759,0.74269,0.659128
100,0.1621,0.936798,0.77193,0.633566


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9824,0.799955,0.631579,0.386706
20,0.7774,0.718888,0.690058,0.46181
30,0.6263,0.646731,0.725146,0.508604
40,0.4659,0.576966,0.777778,0.619937
50,0.3895,0.612372,0.748538,0.589475
60,0.2591,0.754749,0.766082,0.620015
70,0.2716,0.879121,0.754386,0.605239
80,0.1728,0.696254,0.777778,0.684601
90,0.1835,1.177759,0.74269,0.659128
100,0.1621,0.936798,0.77193,0.633566


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9698,0.89605,0.614035,0.382698
20,0.6801,0.662729,0.725146,0.515531
30,0.4812,0.64592,0.760234,0.540195
40,0.4052,1.207732,0.660819,0.537094
50,0.3361,0.732454,0.766082,0.642808
60,0.1668,0.834428,0.754386,0.601767
70,0.144,0.896015,0.77193,0.626981
80,0.0829,1.095441,0.736842,0.632287
90,0.0744,1.174128,0.77193,0.668525
100,0.0368,1.220766,0.77193,0.658959


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9698,0.89605,0.614035,0.382698
20,0.6801,0.662729,0.725146,0.515531
30,0.4812,0.64592,0.760234,0.540195
40,0.4052,1.207732,0.660819,0.537094
50,0.3361,0.732454,0.766082,0.642808
60,0.1668,0.834428,0.754386,0.601767
70,0.144,0.896015,0.77193,0.626981
80,0.0829,1.095441,0.736842,0.632287
90,0.0744,1.174128,0.77193,0.668525
100,0.0368,1.220766,0.77193,0.658959


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9698,0.89605,0.614035,0.382698
20,0.6801,0.662729,0.725146,0.515531
30,0.4812,0.64592,0.760234,0.540195
40,0.4052,1.207732,0.660819,0.537094
50,0.3361,0.732454,0.766082,0.642808
60,0.1668,0.834428,0.754386,0.601767
70,0.144,0.896015,0.77193,0.626981
80,0.0829,1.095441,0.736842,0.632287
90,0.0744,1.174128,0.77193,0.668525
100,0.0368,1.220766,0.77193,0.658959


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9596,0.791463,0.654971,0.468023
20,0.763,0.761554,0.684211,0.493145
30,0.634,0.666788,0.707602,0.508335
40,0.5727,0.803347,0.707602,0.505664
50,0.4392,1.012399,0.71345,0.620371
60,0.3183,0.829614,0.730994,0.645644
70,0.1537,0.943796,0.730994,0.626863
80,0.1427,1.11644,0.730994,0.626993
90,0.0953,1.233772,0.748538,0.669148
100,0.083,1.264947,0.730994,0.639819


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9596,0.791463,0.654971,0.468023
20,0.763,0.761554,0.684211,0.493145
30,0.634,0.666788,0.707602,0.508335
40,0.5727,0.803347,0.707602,0.505664
50,0.4392,1.012399,0.71345,0.620371
60,0.3183,0.829614,0.730994,0.645644
70,0.1537,0.943796,0.730994,0.626863
80,0.1427,1.11644,0.730994,0.626993
90,0.0953,1.233772,0.748538,0.669148
100,0.083,1.264947,0.730994,0.639819


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9596,0.791463,0.654971,0.468023
20,0.763,0.761554,0.684211,0.493145
30,0.634,0.666788,0.707602,0.508335
40,0.5727,0.803347,0.707602,0.505664
50,0.4392,1.012399,0.71345,0.620371
60,0.3183,0.829614,0.730994,0.645644
70,0.1537,0.943796,0.730994,0.626863
80,0.1427,1.11644,0.730994,0.626993
90,0.0953,1.233772,0.748538,0.669148
100,0.083,1.264947,0.730994,0.639819


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9995,0.916866,0.590643,0.390814
20,0.9235,0.866863,0.631579,0.420694
30,0.8641,0.75906,0.701754,0.495794
40,0.6681,0.645901,0.725146,0.532732
50,0.5301,0.56738,0.760234,0.665425
60,0.4245,0.537464,0.795322,0.648606
70,0.3071,0.715294,0.760234,0.633275
80,0.2172,0.6354,0.795322,0.691589
90,0.1636,0.757041,0.754386,0.675985
100,0.1614,0.750229,0.777778,0.673849


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9995,0.916866,0.590643,0.390814
20,0.9235,0.866863,0.631579,0.420694
30,0.8641,0.75906,0.701754,0.495794
40,0.6681,0.645901,0.725146,0.532732
50,0.5301,0.56738,0.760234,0.665425
60,0.4245,0.537464,0.795322,0.648606
70,0.3071,0.715294,0.760234,0.633275
80,0.2172,0.6354,0.795322,0.691589
90,0.1636,0.757041,0.754386,0.675985
100,0.1614,0.750229,0.777778,0.673849


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9995,0.916866,0.590643,0.390814
20,0.9235,0.866863,0.631579,0.420694
30,0.8641,0.75906,0.701754,0.495794
40,0.6681,0.645901,0.725146,0.532732
50,0.5301,0.56738,0.760234,0.665425
60,0.4245,0.537464,0.795322,0.648606
70,0.3071,0.715294,0.760234,0.633275
80,0.2172,0.6354,0.795322,0.691589
90,0.1636,0.757041,0.754386,0.675985
100,0.1614,0.750229,0.777778,0.673849


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9818,0.816313,0.678363,0.470134
20,0.8107,0.727009,0.684211,0.606566
30,0.6334,0.725743,0.649123,0.466529
40,0.5219,0.655679,0.725146,0.623073
50,0.3733,0.736977,0.707602,0.643548
60,0.2552,0.785146,0.701754,0.603704
70,0.171,0.881125,0.71345,0.60827
80,0.1263,0.916294,0.730994,0.632765
90,0.1053,1.206083,0.666667,0.58905
100,0.0941,0.953016,0.74269,0.674313


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9818,0.816313,0.678363,0.470134
20,0.8107,0.727009,0.684211,0.606566
30,0.6334,0.725743,0.649123,0.466529
40,0.5219,0.655679,0.725146,0.623073
50,0.3733,0.736977,0.707602,0.643548
60,0.2552,0.785146,0.701754,0.603704
70,0.171,0.881125,0.71345,0.60827
80,0.1263,0.916294,0.730994,0.632765
90,0.1053,1.206083,0.666667,0.58905
100,0.0941,0.953016,0.74269,0.674313


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9818,0.816313,0.678363,0.470134
20,0.8107,0.727009,0.684211,0.606566
30,0.6334,0.725743,0.649123,0.466529
40,0.5219,0.655679,0.725146,0.623073
50,0.3733,0.736977,0.707602,0.643548
60,0.2552,0.785146,0.701754,0.603704
70,0.171,0.881125,0.71345,0.60827
80,0.1263,0.916294,0.730994,0.632765
90,0.1053,1.206083,0.666667,0.58905
100,0.0941,0.953016,0.74269,0.674313


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9705,0.887678,0.584795,0.406931
20,0.8061,0.695098,0.707602,0.562927
30,0.6443,0.616448,0.748538,0.599622
40,0.5298,0.552204,0.783626,0.703187
50,0.4089,0.617,0.760234,0.664055
60,0.3194,0.654544,0.77193,0.688822
70,0.2056,0.748402,0.736842,0.63598
80,0.1322,0.945776,0.748538,0.650947
90,0.0803,0.80447,0.795322,0.715602
100,0.056,1.081608,0.74269,0.635464


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9705,0.887678,0.584795,0.406931
20,0.8061,0.695098,0.707602,0.562927
30,0.6443,0.616448,0.748538,0.599622
40,0.5298,0.552204,0.783626,0.703187
50,0.4089,0.617,0.760234,0.664055
60,0.3194,0.654544,0.77193,0.688822
70,0.2056,0.748402,0.736842,0.63598
80,0.1322,0.945776,0.748538,0.650947
90,0.0803,0.80447,0.795322,0.715602
100,0.056,1.081608,0.74269,0.635464


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9705,0.887678,0.584795,0.406931
20,0.8061,0.695098,0.707602,0.562927
30,0.6443,0.616448,0.748538,0.599622
40,0.5298,0.552204,0.783626,0.703187
50,0.4089,0.617,0.760234,0.664055
60,0.3194,0.654544,0.77193,0.688822
70,0.2056,0.748402,0.736842,0.63598
80,0.1322,0.945776,0.748538,0.650947
90,0.0803,0.80447,0.795322,0.715602
100,0.056,1.081608,0.74269,0.635464


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.96,0.760313,0.701754,0.478391
20,0.7616,0.627446,0.730994,0.596421
30,0.6036,0.53011,0.754386,0.59769
40,0.4139,0.45398,0.807018,0.708106
50,0.3353,0.470285,0.830409,0.741988
60,0.1684,0.512534,0.818713,0.766652
70,0.0912,0.537863,0.830409,0.789379
80,0.0326,0.657396,0.818713,0.763473
90,0.0128,0.745158,0.824561,0.768597
100,0.0135,0.819396,0.812865,0.753403


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.96,0.760313,0.701754,0.478391
20,0.7616,0.627446,0.730994,0.596421
30,0.6036,0.53011,0.754386,0.59769
40,0.4139,0.45398,0.807018,0.708106
50,0.3353,0.470285,0.830409,0.741988
60,0.1684,0.512534,0.818713,0.766652
70,0.0912,0.537863,0.830409,0.789379
80,0.0326,0.657396,0.818713,0.763473
90,0.0128,0.745158,0.824561,0.768597
100,0.0135,0.819396,0.812865,0.753403


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.96,0.760313,0.701754,0.478391
20,0.7616,0.627446,0.730994,0.596421
30,0.6036,0.53011,0.754386,0.59769
40,0.4139,0.45398,0.807018,0.708106
50,0.3353,0.470285,0.830409,0.741988
60,0.1684,0.512534,0.818713,0.766652
70,0.0912,0.537863,0.830409,0.789379
80,0.0326,0.657396,0.818713,0.763473
90,0.0128,0.745158,0.824561,0.768597
100,0.0135,0.819396,0.812865,0.753403


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9789,0.802113,0.660819,0.44573
20,0.7858,0.696173,0.707602,0.490909
30,0.6744,0.614536,0.74269,0.594117
40,0.6376,0.705369,0.684211,0.532604
50,0.5935,0.639976,0.71345,0.596505
60,0.4756,0.554034,0.766082,0.654188
70,0.4128,0.535396,0.77193,0.628632
80,0.3298,0.570749,0.783626,0.714349
90,0.2447,0.651335,0.777778,0.698955
100,0.1634,0.59896,0.80117,0.720244


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9789,0.802113,0.660819,0.44573
20,0.7858,0.696173,0.707602,0.490909
30,0.6744,0.614536,0.74269,0.594117
40,0.6376,0.705369,0.684211,0.532604
50,0.5935,0.639976,0.71345,0.596505
60,0.4756,0.554034,0.766082,0.654188
70,0.4128,0.535396,0.77193,0.628632
80,0.3298,0.570749,0.783626,0.714349
90,0.2447,0.651335,0.777778,0.698955
100,0.1634,0.59896,0.80117,0.720244


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9789,0.802113,0.660819,0.44573
20,0.7858,0.696173,0.707602,0.490909
30,0.6744,0.614536,0.74269,0.594117
40,0.6376,0.705369,0.684211,0.532604
50,0.5935,0.639976,0.71345,0.596505
60,0.4756,0.554034,0.766082,0.654188
70,0.4128,0.535396,0.77193,0.628632
80,0.3298,0.570749,0.783626,0.714349
90,0.2447,0.651335,0.777778,0.698955
100,0.1634,0.59896,0.80117,0.720244


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9285,0.770713,0.666667,0.467493
20,0.6744,0.641187,0.74269,0.550997
30,0.518,0.617543,0.74269,0.639444
40,0.3927,0.559852,0.777778,0.694961
50,0.2959,0.534429,0.783626,0.721819
60,0.2094,0.52151,0.777778,0.698952
70,0.1175,0.55964,0.818713,0.774095
80,0.0584,0.622014,0.812865,0.754076
90,0.0463,0.710166,0.795322,0.741455
100,0.0296,0.772263,0.812865,0.754017


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9285,0.770713,0.666667,0.467493
20,0.6744,0.641187,0.74269,0.550997
30,0.518,0.617543,0.74269,0.639444
40,0.3927,0.559852,0.777778,0.694961
50,0.2959,0.534429,0.783626,0.721819
60,0.2094,0.52151,0.777778,0.698952
70,0.1175,0.55964,0.818713,0.774095
80,0.0584,0.622014,0.812865,0.754076
90,0.0463,0.710166,0.795322,0.741455
100,0.0296,0.772263,0.812865,0.754017


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9285,0.770713,0.666667,0.467493
20,0.6744,0.641187,0.74269,0.550997
30,0.518,0.617543,0.74269,0.639444
40,0.3927,0.559852,0.777778,0.694961
50,0.2959,0.534429,0.783626,0.721819
60,0.2094,0.52151,0.777778,0.698952
70,0.1175,0.55964,0.818713,0.774095
80,0.0584,0.622014,0.812865,0.754076
90,0.0463,0.710166,0.795322,0.741455
100,0.0296,0.772263,0.812865,0.754017


DatasetDict({
    train: Dataset({
        features: ['review', 'label'],
        num_rows: 680
    })
    test: Dataset({
        features: ['review', 'label'],
        num_rows: 171
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.938,0.701678,0.672515,0.449559
20,0.6658,0.591335,0.730994,0.561848
30,0.4325,0.567209,0.754386,0.676976
40,0.2103,0.641747,0.754386,0.672365
50,0.1183,0.771882,0.77193,0.674328
60,0.0328,0.8719,0.754386,0.667361
70,0.0118,0.972553,0.777778,0.702924
80,0.0039,1.072692,0.766082,0.695911
90,0.0022,1.252739,0.725146,0.622322
100,0.0019,1.230098,0.754386,0.681255


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.938,0.701678,0.672515,0.449559
20,0.6658,0.591335,0.730994,0.561848
30,0.4325,0.567209,0.754386,0.676976
40,0.2103,0.641747,0.754386,0.672365
50,0.1183,0.771882,0.77193,0.674328
60,0.0328,0.8719,0.754386,0.667361
70,0.0118,0.972553,0.777778,0.702924
80,0.0039,1.072692,0.766082,0.695911
90,0.0022,1.252739,0.725146,0.622322
100,0.0019,1.230098,0.754386,0.681255


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.938,0.701678,0.672515,0.449559
20,0.6658,0.591335,0.730994,0.561848
30,0.4325,0.567209,0.754386,0.676976
40,0.2103,0.641747,0.754386,0.672365
50,0.1183,0.771882,0.77193,0.674328
60,0.0328,0.8719,0.754386,0.667361
70,0.0118,0.972553,0.777778,0.702924
80,0.0039,1.072692,0.766082,0.695911
90,0.0022,1.252739,0.725146,0.622322
100,0.0019,1.230098,0.754386,0.681255


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9019,0.661238,0.690058,0.514256
20,0.5785,0.567042,0.760234,0.618975
30,0.2957,0.53081,0.795322,0.69691
40,0.1581,0.713352,0.719298,0.650868
50,0.0621,0.722416,0.777778,0.707623
60,0.0183,0.868344,0.807018,0.730144
70,0.0112,0.994046,0.807018,0.74636
80,0.0046,1.101744,0.795322,0.706891
90,0.0034,1.130625,0.80117,0.734162
100,0.0044,1.17492,0.80117,0.734162


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9019,0.661238,0.690058,0.514256
20,0.5785,0.567042,0.760234,0.618975
30,0.2957,0.53081,0.795322,0.69691
40,0.1581,0.713352,0.719298,0.650868
50,0.0621,0.722416,0.777778,0.707623
60,0.0183,0.868344,0.807018,0.730144
70,0.0112,0.994046,0.807018,0.74636
80,0.0046,1.101744,0.795322,0.706891
90,0.0034,1.130625,0.80117,0.734162
100,0.0044,1.17492,0.80117,0.734162


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9019,0.661238,0.690058,0.514256
20,0.5785,0.567042,0.760234,0.618975
30,0.2957,0.53081,0.795322,0.69691
40,0.1581,0.713352,0.719298,0.650868
50,0.0621,0.722416,0.777778,0.707623
60,0.0183,0.868344,0.807018,0.730144
70,0.0112,0.994046,0.807018,0.74636
80,0.0046,1.101744,0.795322,0.706891
90,0.0034,1.130625,0.80117,0.734162
100,0.0044,1.17492,0.80117,0.734162


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9023,0.788045,0.643275,0.439419
20,0.592,0.628732,0.760234,0.658458
30,0.3764,0.504999,0.789474,0.696954
40,0.1728,0.599599,0.812865,0.74304
50,0.069,0.626663,0.812865,0.759234
60,0.0218,0.764783,0.830409,0.780285
70,0.0069,0.92679,0.807018,0.760157
80,0.0043,1.129192,0.789474,0.682381
90,0.002,1.163883,0.783626,0.725469
100,0.0012,1.245812,0.795322,0.709488


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9023,0.788045,0.643275,0.439419
20,0.592,0.628732,0.760234,0.658458
30,0.3764,0.504999,0.789474,0.696954
40,0.1728,0.599599,0.812865,0.74304
50,0.069,0.626663,0.812865,0.759234
60,0.0218,0.764783,0.830409,0.780285
70,0.0069,0.92679,0.807018,0.760157
80,0.0043,1.129192,0.789474,0.682381
90,0.002,1.163883,0.783626,0.725469
100,0.0012,1.245812,0.795322,0.709488


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/680 [00:00<?, ? examples/s]

Map:   0%|          | 0/171 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
10,0.9023,0.788045,0.643275,0.439419
20,0.592,0.628732,0.760234,0.658458
30,0.3764,0.504999,0.789474,0.696954
40,0.1728,0.599599,0.812865,0.74304
50,0.069,0.626663,0.812865,0.759234
60,0.0218,0.764783,0.830409,0.780285
70,0.0069,0.92679,0.807018,0.760157
80,0.0043,1.129192,0.789474,0.682381
90,0.002,1.163883,0.783626,0.725469
100,0.0012,1.245812,0.795322,0.709488


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.807018,0.699862
3,SI2M-Lab/DarijaBERT-arabizi,0.830409,0.780285
6,SI2M-Lab/DarijaBERT-mix,0.853801,0.797231
9,UBC-NLP/MARBERT,0.783626,0.713323
36,UBC-NLP/MARBERTv2,0.818713,0.752615
39,aubmindlab/bert-base-arabertv02-twitter,0.853801,0.80615
41,qarib/bert-base-qarib,0.824561,0.758824
