In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'MYC_cleaned_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/MYC/DATA_CLEANED.csv', encoding='utf-16', engine='python') #, quotechar="'"  , quoting=3


      
display(df.columns)
display(df[:4])

c = df['polarity'].value_counts()
display(c)

classes = set(df['polarity'].values)
display(classes)

df['polarity'] = df['polarity'].astype('category')
df['label'] = df['polarity'].cat.codes

df = df[['sentence', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


# ds = Dataset.from_pandas(df)
# ds = ds.train_test_split(test_size=0.2)

# display(ds)

max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]

seeds = [0, 1, 42]



for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['sentence'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 15
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 100, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 100
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-17 11:56:22.225851: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-17 11:56:22.260151: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['sentence', 'polarity'], dtype='object')

Unnamed: 0,sentence,polarity
0,انسان عبارة عن دواء للإكتئاب❤🎤,1
1,نحبك يا فنان وااااااحسااااااااان❤,1
2,Stream zuin😂 Thank you ilyas ❤️🫶,1
3,وحق الرب الى دوا د الاكتئاب الأسطورة❤️❤️❤️❤️😂,1


polarity
 1    9999
-1    9992
Name: count, dtype: int64

{-1, 1}

2

19991

DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.3991,0.311792,0.864716,0.864115
200,0.3283,0.323498,0.862466,0.860849
300,0.2878,0.306879,0.871468,0.871007
400,0.2599,0.314699,0.863966,0.86297
500,0.2607,0.294349,0.870468,0.87036
600,0.1785,0.370524,0.867967,0.867936
700,0.1823,0.372049,0.862216,0.862213
800,0.1538,0.428564,0.868717,0.868691
900,0.1267,0.447508,0.859715,0.859696
1000,0.1304,0.464609,0.859965,0.859965


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4102,0.34055,0.859465,0.859454
200,0.3362,0.320838,0.862466,0.86104
300,0.3073,0.313962,0.869717,0.86919
400,0.2611,0.294697,0.876469,0.876111
500,0.2619,0.294415,0.873218,0.873142
600,0.1849,0.390979,0.858965,0.85895
700,0.1857,0.395849,0.864716,0.864716
800,0.1603,0.453808,0.866217,0.866213
900,0.1318,0.449985,0.862716,0.862716
1000,0.141,0.39631,0.869217,0.869043


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4102,0.34055,0.859465,0.859454
200,0.3362,0.320838,0.862466,0.86104
300,0.3073,0.313962,0.869717,0.86919
400,0.2611,0.294697,0.876469,0.876111
500,0.2619,0.294415,0.873218,0.873142
600,0.1849,0.390979,0.858965,0.85895
700,0.1857,0.395849,0.864716,0.864716
800,0.1603,0.453808,0.866217,0.866213
900,0.1318,0.449985,0.862716,0.862716
1000,0.141,0.39631,0.869217,0.869043


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4081,0.34306,0.850963,0.85041
200,0.3135,0.325816,0.863716,0.863155
300,0.2854,0.309649,0.866967,0.866415
400,0.256,0.310603,0.868217,0.868078
500,0.2302,0.319973,0.866217,0.865927
600,0.172,0.414198,0.863716,0.86358
700,0.1705,0.379989,0.866217,0.866057
800,0.15,0.461622,0.863716,0.863669
900,0.1341,0.448924,0.866217,0.865765
1000,0.1296,0.494576,0.862966,0.862878


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4081,0.34306,0.850963,0.85041
200,0.3135,0.325816,0.863716,0.863155
300,0.2854,0.309649,0.866967,0.866415
400,0.256,0.310603,0.868217,0.868078
500,0.2302,0.319973,0.866217,0.865927
600,0.172,0.414198,0.863716,0.86358
700,0.1705,0.379989,0.866217,0.866057
800,0.15,0.461622,0.863716,0.863669
900,0.1341,0.448924,0.866217,0.865765
1000,0.1296,0.494576,0.862966,0.862878


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4081,0.34306,0.850963,0.85041
200,0.3135,0.325816,0.863716,0.863155
300,0.2854,0.309649,0.866967,0.866415
400,0.256,0.310603,0.868217,0.868078
500,0.2302,0.319973,0.866217,0.865927
600,0.172,0.414198,0.863716,0.86358
700,0.1705,0.379989,0.866217,0.866057
800,0.15,0.461622,0.863716,0.863669
900,0.1341,0.448924,0.866217,0.865765
1000,0.1296,0.494576,0.862966,0.862878


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.3948,0.332103,0.856464,0.856328
200,0.339,0.318064,0.868217,0.867003
300,0.2888,0.335951,0.856714,0.856613
400,0.2479,0.330076,0.863716,0.863519
500,0.2453,0.296463,0.871218,0.870696
600,0.1732,0.383193,0.863466,0.863337
700,0.1731,0.394981,0.872218,0.871615
800,0.1456,0.486912,0.866717,0.866548
900,0.1245,0.502364,0.859965,0.859961
1000,0.1276,0.477701,0.866467,0.866101


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.3948,0.332103,0.856464,0.856328
200,0.339,0.318064,0.868217,0.867003
300,0.2888,0.335951,0.856714,0.856613
400,0.2479,0.330076,0.863716,0.863519
500,0.2453,0.296463,0.871218,0.870696
600,0.1732,0.383193,0.863466,0.863337
700,0.1731,0.394981,0.872218,0.871615
800,0.1456,0.486912,0.866717,0.866548
900,0.1245,0.502364,0.859965,0.859961
1000,0.1276,0.477701,0.866467,0.866101


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.3948,0.332103,0.856464,0.856328
200,0.339,0.318064,0.868217,0.867003
300,0.2888,0.335951,0.856714,0.856613
400,0.2479,0.330076,0.863716,0.863519
500,0.2453,0.296463,0.871218,0.870696
600,0.1732,0.383193,0.863466,0.863337
700,0.1731,0.394981,0.872218,0.871615
800,0.1456,0.486912,0.866717,0.866548
900,0.1245,0.502364,0.859965,0.859961
1000,0.1276,0.477701,0.866467,0.866101


DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2728,0.108111,0.952738,0.952715
200,0.1231,0.102323,0.955989,0.955989
300,0.0945,0.16398,0.957739,0.9577
400,0.0867,0.102874,0.96074,0.960736
500,0.0848,0.107247,0.962241,0.962233
600,0.0541,0.116373,0.962991,0.962979
700,0.0604,0.117342,0.964491,0.964482
800,0.0541,0.129984,0.965241,0.965239
900,0.0467,0.173785,0.964991,0.96499
1000,0.0544,0.110313,0.965241,0.965239


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2728,0.108111,0.952738,0.952715
200,0.1231,0.102323,0.955989,0.955989
300,0.0945,0.16398,0.957739,0.9577
400,0.0867,0.102874,0.96074,0.960736
500,0.0848,0.107247,0.962241,0.962233
600,0.0541,0.116373,0.962991,0.962979
700,0.0604,0.117342,0.964491,0.964482
800,0.0541,0.129984,0.965241,0.965239
900,0.0467,0.173785,0.964991,0.96499
1000,0.0544,0.110313,0.965241,0.965239


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2728,0.108111,0.952738,0.952715
200,0.1231,0.102323,0.955989,0.955989
300,0.0945,0.16398,0.957739,0.9577
400,0.0867,0.102874,0.96074,0.960736
500,0.0848,0.107247,0.962241,0.962233
600,0.0541,0.116373,0.962991,0.962979
700,0.0604,0.117342,0.964491,0.964482
800,0.0541,0.129984,0.965241,0.965239
900,0.0467,0.173785,0.964991,0.96499
1000,0.0544,0.110313,0.965241,0.965239


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.266,0.122473,0.941985,0.941925
200,0.1263,0.093593,0.96049,0.960461
300,0.0923,0.11075,0.95999,0.959983
400,0.0872,0.102892,0.96124,0.961233
500,0.0775,0.106298,0.963991,0.963991
600,0.067,0.11638,0.96049,0.96049
700,0.0561,0.101272,0.964741,0.964736
800,0.0511,0.134313,0.967242,0.967241
900,0.048,0.119592,0.962241,0.962239
1000,0.0403,0.15228,0.966492,0.96649


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.266,0.122473,0.941985,0.941925
200,0.1263,0.093593,0.96049,0.960461
300,0.0923,0.11075,0.95999,0.959983
400,0.0872,0.102892,0.96124,0.961233
500,0.0775,0.106298,0.963991,0.963991
600,0.067,0.11638,0.96049,0.96049
700,0.0561,0.101272,0.964741,0.964736
800,0.0511,0.134313,0.967242,0.967241
900,0.048,0.119592,0.962241,0.962239
1000,0.0403,0.15228,0.966492,0.96649


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.266,0.122473,0.941985,0.941925
200,0.1263,0.093593,0.96049,0.960461
300,0.0923,0.11075,0.95999,0.959983
400,0.0872,0.102892,0.96124,0.961233
500,0.0775,0.106298,0.963991,0.963991
600,0.067,0.11638,0.96049,0.96049
700,0.0561,0.101272,0.964741,0.964736
800,0.0511,0.134313,0.967242,0.967241
900,0.048,0.119592,0.962241,0.962239
1000,0.0403,0.15228,0.966492,0.96649


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2576,0.132261,0.941235,0.941148
200,0.1242,0.106131,0.95999,0.95999
300,0.0937,0.153976,0.954739,0.954724
400,0.0757,0.13717,0.956739,0.956731
500,0.0778,0.109496,0.96149,0.961489
600,0.0608,0.163717,0.95849,0.95849
700,0.0555,0.132009,0.957989,0.957971
800,0.0467,0.166451,0.95949,0.959484
900,0.0431,0.146832,0.95924,0.959233
1000,0.046,0.19614,0.956739,0.956728


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2576,0.132261,0.941235,0.941148
200,0.1242,0.106131,0.95999,0.95999
300,0.0937,0.153976,0.954739,0.954724
400,0.0757,0.13717,0.956739,0.956731
500,0.0778,0.109496,0.96149,0.961489
600,0.0608,0.163717,0.95849,0.95849
700,0.0555,0.132009,0.957989,0.957971
800,0.0467,0.166451,0.95949,0.959484
900,0.0431,0.146832,0.95924,0.959233
1000,0.046,0.19614,0.956739,0.956728


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2576,0.132261,0.941235,0.941148
200,0.1242,0.106131,0.95999,0.95999
300,0.0937,0.153976,0.954739,0.954724
400,0.0757,0.13717,0.956739,0.956731
500,0.0778,0.109496,0.96149,0.961489
600,0.0608,0.163717,0.95849,0.95849
700,0.0555,0.132009,0.957989,0.957971
800,0.0467,0.166451,0.95949,0.959484
900,0.0431,0.146832,0.95924,0.959233
1000,0.046,0.19614,0.956739,0.956728


DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4235,0.319577,0.849212,0.849149
200,0.3127,0.296856,0.869217,0.868051
300,0.261,0.324152,0.877219,0.876272
400,0.2156,0.298524,0.885221,0.885121
500,0.2151,0.300052,0.88047,0.880286
600,0.1255,0.356561,0.877219,0.877219
700,0.1362,0.394238,0.88172,0.881717
800,0.1178,0.493881,0.875469,0.875286
900,0.0825,0.463876,0.883221,0.883014
1000,0.0998,0.415274,0.88097,0.880747


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4235,0.319577,0.849212,0.849149
200,0.3127,0.296856,0.869217,0.868051
300,0.261,0.324152,0.877219,0.876272
400,0.2156,0.298524,0.885221,0.885121
500,0.2151,0.300052,0.88047,0.880286
600,0.1255,0.356561,0.877219,0.877219
700,0.1362,0.394238,0.88172,0.881717
800,0.1178,0.493881,0.875469,0.875286
900,0.0825,0.463876,0.883221,0.883014
1000,0.0998,0.415274,0.88097,0.880747


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4235,0.319577,0.849212,0.849149
200,0.3127,0.296856,0.869217,0.868051
300,0.261,0.324152,0.877219,0.876272
400,0.2156,0.298524,0.885221,0.885121
500,0.2151,0.300052,0.88047,0.880286
600,0.1255,0.356561,0.877219,0.877219
700,0.1362,0.394238,0.88172,0.881717
800,0.1178,0.493881,0.875469,0.875286
900,0.0825,0.463876,0.883221,0.883014
1000,0.0998,0.415274,0.88097,0.880747


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4283,0.356662,0.836959,0.836855
200,0.3163,0.356382,0.855464,0.855444
300,0.2481,0.326508,0.867467,0.867454
400,0.2192,0.309859,0.864466,0.864447
500,0.2017,0.33429,0.875969,0.875852
600,0.1238,0.367402,0.862216,0.862213
700,0.1363,0.512268,0.862716,0.862711
800,0.11,0.464199,0.88022,0.880112
900,0.0922,0.517902,0.866967,0.866958
1000,0.0967,0.487734,0.869967,0.869924


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4283,0.356662,0.836959,0.836855
200,0.3163,0.356382,0.855464,0.855444
300,0.2481,0.326508,0.867467,0.867454
400,0.2192,0.309859,0.864466,0.864447
500,0.2017,0.33429,0.875969,0.875852
600,0.1238,0.367402,0.862216,0.862213
700,0.1363,0.512268,0.862716,0.862711
800,0.11,0.464199,0.88022,0.880112
900,0.0922,0.517902,0.866967,0.866958
1000,0.0967,0.487734,0.869967,0.869924


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4283,0.356662,0.836959,0.836855
200,0.3163,0.356382,0.855464,0.855444
300,0.2481,0.326508,0.867467,0.867454
400,0.2192,0.309859,0.864466,0.864447
500,0.2017,0.33429,0.875969,0.875852
600,0.1238,0.367402,0.862216,0.862213
700,0.1363,0.512268,0.862716,0.862711
800,0.11,0.464199,0.88022,0.880112
900,0.0922,0.517902,0.866967,0.866958
1000,0.0967,0.487734,0.869967,0.869924


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4088,0.312534,0.862216,0.861115
200,0.331,0.291116,0.873718,0.873395
300,0.262,0.324898,0.865466,0.865466
400,0.2156,0.334311,0.874469,0.874465
500,0.2029,0.325143,0.88047,0.880179
600,0.1288,0.363388,0.863716,0.863712
700,0.1308,0.458611,0.859215,0.859084
800,0.1078,0.505953,0.875219,0.875079
900,0.0886,0.55481,0.870718,0.870437
1000,0.097,0.507759,0.871468,0.87103


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4088,0.312534,0.862216,0.861115
200,0.331,0.291116,0.873718,0.873395
300,0.262,0.324898,0.865466,0.865466
400,0.2156,0.334311,0.874469,0.874465
500,0.2029,0.325143,0.88047,0.880179
600,0.1288,0.363388,0.863716,0.863712
700,0.1308,0.458611,0.859215,0.859084
800,0.1078,0.505953,0.875219,0.875079
900,0.0886,0.55481,0.870718,0.870437
1000,0.097,0.507759,0.871468,0.87103


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4088,0.312534,0.862216,0.861115
200,0.331,0.291116,0.873718,0.873395
300,0.262,0.324898,0.865466,0.865466
400,0.2156,0.334311,0.874469,0.874465
500,0.2029,0.325143,0.88047,0.880179
600,0.1288,0.363388,0.863716,0.863712
700,0.1308,0.458611,0.859215,0.859084
800,0.1078,0.505953,0.875219,0.875079
900,0.0886,0.55481,0.870718,0.870437
1000,0.097,0.507759,0.871468,0.87103


DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1984,0.103628,0.966742,0.96674
200,0.1055,0.065334,0.977994,0.977989
300,0.0579,0.104125,0.976994,0.976985
400,0.0539,0.05467,0.984746,0.984745
500,0.0556,0.057052,0.984246,0.984245
600,0.03,0.077244,0.983996,0.983996
700,0.0417,0.069325,0.983246,0.983245
800,0.028,0.075359,0.985496,0.985496
900,0.022,0.094137,0.982746,0.982746
1000,0.0195,0.1033,0.981245,0.981244


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1984,0.103628,0.966742,0.96674
200,0.1055,0.065334,0.977994,0.977989
300,0.0579,0.104125,0.976994,0.976985
400,0.0539,0.05467,0.984746,0.984745
500,0.0556,0.057052,0.984246,0.984245
600,0.03,0.077244,0.983996,0.983996
700,0.0417,0.069325,0.983246,0.983245
800,0.028,0.075359,0.985496,0.985496
900,0.022,0.094137,0.982746,0.982746
1000,0.0195,0.1033,0.981245,0.981244


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1984,0.103628,0.966742,0.96674
200,0.1055,0.065334,0.977994,0.977989
300,0.0579,0.104125,0.976994,0.976985
400,0.0539,0.05467,0.984746,0.984745
500,0.0556,0.057052,0.984246,0.984245
600,0.03,0.077244,0.983996,0.983996
700,0.0417,0.069325,0.983246,0.983245
800,0.028,0.075359,0.985496,0.985496
900,0.022,0.094137,0.982746,0.982746
1000,0.0195,0.1033,0.981245,0.981244


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1836,0.085748,0.974744,0.974742
200,0.0988,0.083433,0.979495,0.979495
300,0.0722,0.07168,0.983746,0.983745
400,0.0537,0.088216,0.979745,0.979739
500,0.0442,0.066145,0.984496,0.984496
600,0.0394,0.063442,0.986997,0.986996
700,0.0249,0.080036,0.983496,0.983496
800,0.0284,0.090778,0.982996,0.982993
900,0.0231,0.092964,0.985496,0.985496
1000,0.027,0.082519,0.981245,0.981243


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1836,0.085748,0.974744,0.974742
200,0.0988,0.083433,0.979495,0.979495
300,0.0722,0.07168,0.983746,0.983745
400,0.0537,0.088216,0.979745,0.979739
500,0.0442,0.066145,0.984496,0.984496
600,0.0394,0.063442,0.986997,0.986996
700,0.0249,0.080036,0.983496,0.983496
800,0.0284,0.090778,0.982996,0.982993
900,0.0231,0.092964,0.985496,0.985496
1000,0.027,0.082519,0.981245,0.981243


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1836,0.085748,0.974744,0.974742
200,0.0988,0.083433,0.979495,0.979495
300,0.0722,0.07168,0.983746,0.983745
400,0.0537,0.088216,0.979745,0.979739
500,0.0442,0.066145,0.984496,0.984496
600,0.0394,0.063442,0.986997,0.986996
700,0.0249,0.080036,0.983496,0.983496
800,0.0284,0.090778,0.982996,0.982993
900,0.0231,0.092964,0.985496,0.985496
1000,0.027,0.082519,0.981245,0.981243


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1954,0.127412,0.964491,0.964477
200,0.0888,0.100377,0.978745,0.978737
300,0.0609,0.090766,0.981745,0.981743
400,0.046,0.082058,0.978495,0.978492
500,0.0538,0.084649,0.979745,0.979743
600,0.0355,0.086271,0.982496,0.982492
700,0.0305,0.124479,0.976994,0.976991
800,0.0278,0.11777,0.979995,0.979986
900,0.0177,0.112575,0.980495,0.980485
1000,0.018,0.118131,0.979495,0.979482


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1954,0.127412,0.964491,0.964477
200,0.0888,0.100377,0.978745,0.978737
300,0.0609,0.090766,0.981745,0.981743
400,0.046,0.082058,0.978495,0.978492
500,0.0538,0.084649,0.979745,0.979743
600,0.0355,0.086271,0.982496,0.982492
700,0.0305,0.124479,0.976994,0.976991
800,0.0278,0.11777,0.979995,0.979986
900,0.0177,0.112575,0.980495,0.980485
1000,0.018,0.118131,0.979495,0.979482


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1954,0.127412,0.964491,0.964477
200,0.0888,0.100377,0.978745,0.978737
300,0.0609,0.090766,0.981745,0.981743
400,0.046,0.082058,0.978495,0.978492
500,0.0538,0.084649,0.979745,0.979743
600,0.0355,0.086271,0.982496,0.982492
700,0.0305,0.124479,0.976994,0.976991
800,0.0278,0.11777,0.979995,0.979986
900,0.0177,0.112575,0.980495,0.980485
1000,0.018,0.118131,0.979495,0.979482


DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2779,0.106949,0.967992,0.967991
200,0.1201,0.069139,0.977494,0.977494
300,0.0782,0.09073,0.974744,0.974736
400,0.0671,0.068486,0.980995,0.980994
500,0.0599,0.078228,0.977244,0.977244
600,0.0373,0.06233,0.979995,0.979994
700,0.0393,0.07362,0.982246,0.982244
800,0.0325,0.072165,0.983496,0.983495
900,0.0234,0.100648,0.980495,0.980495
1000,0.0276,0.070837,0.978745,0.978744


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2779,0.106949,0.967992,0.967991
200,0.1201,0.069139,0.977494,0.977494
300,0.0782,0.09073,0.974744,0.974736
400,0.0671,0.068486,0.980995,0.980994
500,0.0599,0.078228,0.977244,0.977244
600,0.0373,0.06233,0.979995,0.979994
700,0.0393,0.07362,0.982246,0.982244
800,0.0325,0.072165,0.983496,0.983495
900,0.0234,0.100648,0.980495,0.980495
1000,0.0276,0.070837,0.978745,0.978744


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2779,0.106949,0.967992,0.967991
200,0.1201,0.069139,0.977494,0.977494
300,0.0782,0.09073,0.974744,0.974736
400,0.0671,0.068486,0.980995,0.980994
500,0.0599,0.078228,0.977244,0.977244
600,0.0373,0.06233,0.979995,0.979994
700,0.0393,0.07362,0.982246,0.982244
800,0.0325,0.072165,0.983496,0.983495
900,0.0234,0.100648,0.980495,0.980495
1000,0.0276,0.070837,0.978745,0.978744


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2899,0.122174,0.957989,0.957987
200,0.1195,0.080741,0.971493,0.971491
300,0.0743,0.081152,0.978995,0.978995
400,0.0629,0.07771,0.979745,0.979743
500,0.0549,0.080921,0.980495,0.980495
600,0.0479,0.088294,0.975994,0.975991
700,0.0293,0.081944,0.981745,0.981745
800,0.0332,0.103934,0.978745,0.978738
900,0.0224,0.117906,0.980245,0.980242
1000,0.0277,0.078252,0.984496,0.984496


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2899,0.122174,0.957989,0.957987
200,0.1195,0.080741,0.971493,0.971491
300,0.0743,0.081152,0.978995,0.978995
400,0.0629,0.07771,0.979745,0.979743
500,0.0549,0.080921,0.980495,0.980495
600,0.0479,0.088294,0.975994,0.975991
700,0.0293,0.081944,0.981745,0.981745
800,0.0332,0.103934,0.978745,0.978738
900,0.0224,0.117906,0.980245,0.980242
1000,0.0277,0.078252,0.984496,0.984496


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2899,0.122174,0.957989,0.957987
200,0.1195,0.080741,0.971493,0.971491
300,0.0743,0.081152,0.978995,0.978995
400,0.0629,0.07771,0.979745,0.979743
500,0.0549,0.080921,0.980495,0.980495
600,0.0479,0.088294,0.975994,0.975991
700,0.0293,0.081944,0.981745,0.981745
800,0.0332,0.103934,0.978745,0.978738
900,0.0224,0.117906,0.980245,0.980242
1000,0.0277,0.078252,0.984496,0.984496


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2905,0.14156,0.95849,0.958489
200,0.1061,0.085115,0.974244,0.974239
300,0.0621,0.097768,0.976994,0.97699
400,0.0568,0.081004,0.976494,0.976479
500,0.0645,0.078287,0.980495,0.980492
600,0.04,0.101866,0.977744,0.97774
700,0.0334,0.097318,0.979245,0.979241
800,0.0312,0.102813,0.979245,0.979232
900,0.0256,0.12791,0.973743,0.973724
1000,0.0197,0.111944,0.977244,0.977228


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2905,0.14156,0.95849,0.958489
200,0.1061,0.085115,0.974244,0.974239
300,0.0621,0.097768,0.976994,0.97699
400,0.0568,0.081004,0.976494,0.976479
500,0.0645,0.078287,0.980495,0.980492
600,0.04,0.101866,0.977744,0.97774
700,0.0334,0.097318,0.979245,0.979241
800,0.0312,0.102813,0.979245,0.979232
900,0.0256,0.12791,0.973743,0.973724
1000,0.0197,0.111944,0.977244,0.977228


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.2905,0.14156,0.95849,0.958489
200,0.1061,0.085115,0.974244,0.974239
300,0.0621,0.097768,0.976994,0.97699
400,0.0568,0.081004,0.976494,0.976479
500,0.0645,0.078287,0.980495,0.980492
600,0.04,0.101866,0.977744,0.97774
700,0.0334,0.097318,0.979245,0.979241
800,0.0312,0.102813,0.979245,0.979232
900,0.0256,0.12791,0.973743,0.973724
1000,0.0197,0.111944,0.977244,0.977228


DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1602,0.055872,0.985496,0.985496
200,0.0597,0.045184,0.987997,0.987997
300,0.0455,0.041063,0.988747,0.988747
400,0.0399,0.048522,0.989247,0.989247
500,0.0342,0.054301,0.989247,0.989247
600,0.0214,0.047755,0.988997,0.988997
700,0.0244,0.049655,0.989747,0.989747
800,0.0215,0.056128,0.990998,0.990998
900,0.0152,0.046634,0.988997,0.988997
1000,0.0144,0.047673,0.989997,0.989997


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1602,0.055872,0.985496,0.985496
200,0.0597,0.045184,0.987997,0.987997
300,0.0455,0.041063,0.988747,0.988747
400,0.0399,0.048522,0.989247,0.989247
500,0.0342,0.054301,0.989247,0.989247
600,0.0214,0.047755,0.988997,0.988997
700,0.0244,0.049655,0.989747,0.989747
800,0.0215,0.056128,0.990998,0.990998
900,0.0152,0.046634,0.988997,0.988997
1000,0.0144,0.047673,0.989997,0.989997


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1602,0.055872,0.985496,0.985496
200,0.0597,0.045184,0.987997,0.987997
300,0.0455,0.041063,0.988747,0.988747
400,0.0399,0.048522,0.989247,0.989247
500,0.0342,0.054301,0.989247,0.989247
600,0.0214,0.047755,0.988997,0.988997
700,0.0244,0.049655,0.989747,0.989747
800,0.0215,0.056128,0.990998,0.990998
900,0.0152,0.046634,0.988997,0.988997
1000,0.0144,0.047673,0.989997,0.989997


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.144,0.060965,0.986247,0.986246
200,0.0648,0.047088,0.986497,0.986496
300,0.045,0.0532,0.988997,0.988996
400,0.0362,0.044189,0.990748,0.990747
500,0.0368,0.04591,0.989747,0.989747
600,0.023,0.046587,0.989997,0.989997
700,0.0176,0.055327,0.988747,0.988747
800,0.0161,0.056123,0.989747,0.989747
900,0.0116,0.064317,0.989747,0.989747
1000,0.0131,0.056036,0.987247,0.987247


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.144,0.060965,0.986247,0.986246
200,0.0648,0.047088,0.986497,0.986496
300,0.045,0.0532,0.988997,0.988996
400,0.0362,0.044189,0.990748,0.990747
500,0.0368,0.04591,0.989747,0.989747
600,0.023,0.046587,0.989997,0.989997
700,0.0176,0.055327,0.988747,0.988747
800,0.0161,0.056123,0.989747,0.989747
900,0.0116,0.064317,0.989747,0.989747
1000,0.0131,0.056036,0.987247,0.987247


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.144,0.060965,0.986247,0.986246
200,0.0648,0.047088,0.986497,0.986496
300,0.045,0.0532,0.988997,0.988996
400,0.0362,0.044189,0.990748,0.990747
500,0.0368,0.04591,0.989747,0.989747
600,0.023,0.046587,0.989997,0.989997
700,0.0176,0.055327,0.988747,0.988747
800,0.0161,0.056123,0.989747,0.989747
900,0.0116,0.064317,0.989747,0.989747
1000,0.0131,0.056036,0.987247,0.987247


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1565,0.076505,0.976744,0.976741
200,0.0685,0.068151,0.982496,0.982492
300,0.0469,0.065244,0.984746,0.984739
400,0.0347,0.069107,0.983746,0.983739
500,0.0424,0.057659,0.985246,0.985242
600,0.0259,0.082039,0.984746,0.984744
700,0.0211,0.085081,0.983996,0.983987
800,0.0206,0.092832,0.982996,0.982987
900,0.0201,0.09138,0.982996,0.982984
1000,0.0183,0.067764,0.987247,0.987241


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1565,0.076505,0.976744,0.976741
200,0.0685,0.068151,0.982496,0.982492
300,0.0469,0.065244,0.984746,0.984739
400,0.0347,0.069107,0.983746,0.983739
500,0.0424,0.057659,0.985246,0.985242
600,0.0259,0.082039,0.984746,0.984744
700,0.0211,0.085081,0.983996,0.983987
800,0.0206,0.092832,0.982996,0.982987
900,0.0201,0.09138,0.982996,0.982984
1000,0.0183,0.067764,0.987247,0.987241


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1565,0.076505,0.976744,0.976741
200,0.0685,0.068151,0.982496,0.982492
300,0.0469,0.065244,0.984746,0.984739
400,0.0347,0.069107,0.983746,0.983739
500,0.0424,0.057659,0.985246,0.985242
600,0.0259,0.082039,0.984746,0.984744
700,0.0211,0.085081,0.983996,0.983987
800,0.0206,0.092832,0.982996,0.982987
900,0.0201,0.09138,0.982996,0.982984
1000,0.0183,0.067764,0.987247,0.987241


DatasetDict({
    train: Dataset({
        features: ['sentence', 'label'],
        num_rows: 15992
    })
    test: Dataset({
        features: ['sentence', 'label'],
        num_rows: 3999
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1118,0.057411,0.985996,0.985996
200,0.0632,0.040128,0.988747,0.988747
300,0.0433,0.045645,0.988497,0.988496
400,0.0399,0.035376,0.989997,0.989997
500,0.0252,0.052093,0.988747,0.988747
600,0.0152,0.048765,0.989497,0.989497
700,0.0145,0.04634,0.988747,0.988746
800,0.0192,0.045562,0.990498,0.990497
900,0.0121,0.050249,0.989497,0.989497
1000,0.0077,0.044706,0.989247,0.989247


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1118,0.057411,0.985996,0.985996
200,0.0632,0.040128,0.988747,0.988747
300,0.0433,0.045645,0.988497,0.988496
400,0.0399,0.035376,0.989997,0.989997
500,0.0252,0.052093,0.988747,0.988747
600,0.0152,0.048765,0.989497,0.989497
700,0.0145,0.04634,0.988747,0.988746
800,0.0192,0.045562,0.990498,0.990497
900,0.0121,0.050249,0.989497,0.989497
1000,0.0077,0.044706,0.989247,0.989247


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1118,0.057411,0.985996,0.985996
200,0.0632,0.040128,0.988747,0.988747
300,0.0433,0.045645,0.988497,0.988496
400,0.0399,0.035376,0.989997,0.989997
500,0.0252,0.052093,0.988747,0.988747
600,0.0152,0.048765,0.989497,0.989497
700,0.0145,0.04634,0.988747,0.988746
800,0.0192,0.045562,0.990498,0.990497
900,0.0121,0.050249,0.989497,0.989497
1000,0.0077,0.044706,0.989247,0.989247


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.111,0.056011,0.984496,0.984494
200,0.0695,0.042556,0.986997,0.986997
300,0.0451,0.056965,0.986997,0.986996
400,0.0346,0.053452,0.988247,0.988247
500,0.0347,0.047403,0.990998,0.990997
600,0.0253,0.036838,0.989747,0.989747
700,0.0146,0.07295,0.986997,0.986997
800,0.0151,0.070475,0.986997,0.986997
900,0.0114,0.054988,0.988247,0.988246
1000,0.0117,0.055139,0.989997,0.989997


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.111,0.056011,0.984496,0.984494
200,0.0695,0.042556,0.986997,0.986997
300,0.0451,0.056965,0.986997,0.986996
400,0.0346,0.053452,0.988247,0.988247
500,0.0347,0.047403,0.990998,0.990997
600,0.0253,0.036838,0.989747,0.989747
700,0.0146,0.07295,0.986997,0.986997
800,0.0151,0.070475,0.986997,0.986997
900,0.0114,0.054988,0.988247,0.988246
1000,0.0117,0.055139,0.989997,0.989997


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.111,0.056011,0.984496,0.984494
200,0.0695,0.042556,0.986997,0.986997
300,0.0451,0.056965,0.986997,0.986996
400,0.0346,0.053452,0.988247,0.988247
500,0.0347,0.047403,0.990998,0.990997
600,0.0253,0.036838,0.989747,0.989747
700,0.0146,0.07295,0.986997,0.986997
800,0.0151,0.070475,0.986997,0.986997
900,0.0114,0.054988,0.988247,0.988246
1000,0.0117,0.055139,0.989997,0.989997


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1056,0.059957,0.985246,0.98524
200,0.059,0.057582,0.985746,0.985743
300,0.0368,0.062546,0.985996,0.985994
400,0.0265,0.062139,0.985496,0.985492
500,0.036,0.053924,0.985246,0.985244
600,0.0211,0.067316,0.984996,0.984992
700,0.0219,0.055213,0.986997,0.986995
800,0.0141,0.110548,0.979995,0.979977
900,0.0123,0.086194,0.983246,0.983235
1000,0.0122,0.102812,0.984496,0.984486


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1056,0.059957,0.985246,0.98524
200,0.059,0.057582,0.985746,0.985743
300,0.0368,0.062546,0.985996,0.985994
400,0.0265,0.062139,0.985496,0.985492
500,0.036,0.053924,0.985246,0.985244
600,0.0211,0.067316,0.984996,0.984992
700,0.0219,0.055213,0.986997,0.986995
800,0.0141,0.110548,0.979995,0.979977
900,0.0123,0.086194,0.983246,0.983235
1000,0.0122,0.102812,0.984496,0.984486


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/15992 [00:00<?, ? examples/s]

Map:   0%|          | 0/3999 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.1056,0.059957,0.985246,0.98524
200,0.059,0.057582,0.985746,0.985743
300,0.0368,0.062546,0.985996,0.985994
400,0.0265,0.062139,0.985496,0.985492
500,0.036,0.053924,0.985246,0.985244
600,0.0211,0.067316,0.984996,0.984992
700,0.0219,0.055213,0.986997,0.986995
800,0.0141,0.110548,0.979995,0.979977
900,0.0123,0.086194,0.983246,0.983235
1000,0.0122,0.102812,0.984496,0.984486


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.969492,0.969491
3,SI2M-Lab/DarijaBERT-arabizi,0.991248,0.991248
6,SI2M-Lab/DarijaBERT-mix,0.991498,0.991497
9,UBC-NLP/MARBERT,0.986997,0.986996
12,UBC-NLP/MARBERTv2,0.984996,0.984996
15,aubmindlab/bert-base-arabertv02-twitter,0.876469,0.876111
17,qarib/bert-base-qarib,0.885221,0.885121
