In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'Open_2'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df1 = pd.read_csv('datasets/OpenAccessArDialect/Sentiment_Anaysis.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3
df2 = pd.read_csv('datasets/OpenAccessArDialect/dialect.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3

df2 = df2[df2['dialect'] == 'Morocco']
      
display(df1.columns)
display(df1[:4])

display(df2.columns)
display(df2[:4])
display(len(df2))



df = df1[df1['Twits'].isin(df2['Twits'])]

display(df[:5])
display(len(df))

c = df['label'].value_counts()
display(c)

classes = set(df['label'].values)
display(classes)

df['label'] = df['label'].astype('category')
df['label'] = df['label'].cat.codes

df = df[['Twits', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))



max_sequence_length = 128



models = [ 
        'faisalq/EgyBERT',            
    'faisalq/SaudiBERT',            
    'tunis-ai/TunBERT',
    'alger-ia/dziribert',
    'SI2M-Lab/DarijaBERT',
    'otmangi/MorRoBERTa',
    'otmangi/MorrBERT'
            
]





seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['Twits'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 12
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 50, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 50
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-18 15:01:49.541536: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-18 15:01:49.728668: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['Unnamed: 0', 'Twits', 'label'], dtype='object')

Unnamed: 0.1,Unnamed: 0,Twits,label
0,0,what happens,neu
1,1,😞😞,neg
2,2,ان شاء الله,neu
3,3,بالتوفيق ان شاء الله,pos


Index(['Twits', 'dialect'], dtype='object')

Unnamed: 0,Twits,dialect
13393,slawiya msikina tb9a f darha 😐😕😕,Morocco
13394,ناس د الرباط أش واقع عندكم تما ... ياكما شي شبه عائلية 😐,Morocco
13395,لي دوا مشاا 😂😂,Morocco
13396,: وزراء تقلقوا,Morocco


9965

Unnamed: 0.1,Unnamed: 0,Twits,label
8,8,ههههههههه,pos
9,9,"هههه ضروري بإذن الله , لفقر را عيب ؤ عار ؤ حشومة",neg
10,10,مع فاق كيم جون من المرض وهو اكتب لينا مشروع قانون شكرا كيم جون ، عاشت كوريا,pos
11,11,الوادافاكية: زوجة اليوسفي تعزي جلالة الملك في وفاة زوجها,neg
12,12,: ها علاش مكنقراوش للقصص للاطفال قبل النوم😂😂😂,neu


8520

label
neu    6923
neg    1200
pos     397
Name: count, dtype: int64

{'neg', 'neu', 'pos'}

3

8520

DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

faisalq/EgyBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.8891,0.85741,0.806925,0.297716
100,0.6436,0.603907,0.806925,0.297716
150,0.4987,0.439402,0.867958,0.519924
200,0.4225,0.406103,0.869131,0.523945
250,0.3469,0.355258,0.872653,0.544987
300,0.2896,0.349073,0.888498,0.64542
350,0.2555,0.355938,0.883216,0.69303
400,0.1978,0.349968,0.884977,0.702558
450,0.1729,0.377242,0.886737,0.704766
500,0.1714,0.375217,0.877347,0.698224


faisalq/EgyBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.8695,0.669616,0.806925,0.297716
100,0.5674,0.479465,0.84331,0.453963
150,0.4271,0.416493,0.857394,0.529053
200,0.4019,0.3871,0.870892,0.530265
250,0.4275,0.482104,0.816901,0.373062
300,0.4266,0.550058,0.819836,0.383508
350,0.5133,0.727582,0.806925,0.297716
400,0.555,0.729891,0.806925,0.297716
450,0.4846,0.682203,0.806925,0.297716
500,0.4529,0.6407,0.806925,0.297716


faisalq/EgyBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.8695,0.669616,0.806925,0.297716
100,0.5674,0.479465,0.84331,0.453963
150,0.4271,0.416493,0.857394,0.529053
200,0.4019,0.3871,0.870892,0.530265
250,0.4275,0.482104,0.816901,0.373062
300,0.4266,0.550058,0.819836,0.383508
350,0.5133,0.727582,0.806925,0.297716
400,0.555,0.729891,0.806925,0.297716
450,0.4846,0.682203,0.806925,0.297716
500,0.4529,0.6407,0.806925,0.297716


faisalq/EgyBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.8773,0.686404,0.789319,0.294085
100,0.5239,0.479641,0.862676,0.524055
150,0.4091,0.44518,0.862089,0.517453
200,0.3701,0.36698,0.877934,0.554513
250,0.3109,0.386369,0.873239,0.543415
300,0.2982,0.373368,0.875587,0.545357
350,0.2861,0.421323,0.866784,0.526831
400,0.2422,0.378798,0.875,0.669191
450,0.2066,0.412622,0.872653,0.666938
500,0.1944,0.3853,0.882629,0.687443


faisalq/EgyBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.8773,0.686404,0.789319,0.294085
100,0.5239,0.479641,0.862676,0.524055
150,0.4091,0.44518,0.862089,0.517453
200,0.3701,0.36698,0.877934,0.554513
250,0.3109,0.386369,0.873239,0.543415
300,0.2982,0.373368,0.875587,0.545357
350,0.2861,0.421323,0.866784,0.526831
400,0.2422,0.378798,0.875,0.669191
450,0.2066,0.412622,0.872653,0.666938
500,0.1944,0.3853,0.882629,0.687443


faisalq/EgyBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.8773,0.686404,0.789319,0.294085
100,0.5239,0.479641,0.862676,0.524055
150,0.4091,0.44518,0.862089,0.517453
200,0.3701,0.36698,0.877934,0.554513
250,0.3109,0.386369,0.873239,0.543415
300,0.2982,0.373368,0.875587,0.545357
350,0.2861,0.421323,0.866784,0.526831
400,0.2422,0.378798,0.875,0.669191
450,0.2066,0.412622,0.872653,0.666938
500,0.1944,0.3853,0.882629,0.687443


faisalq/EgyBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.88,0.672155,0.808685,0.298075
100,0.5562,0.455994,0.869718,0.529325
150,0.4051,0.380221,0.867371,0.512531
200,0.376,0.351707,0.882042,0.551294
250,0.3066,0.354009,0.885563,0.549024
300,0.285,0.378109,0.872653,0.515274
350,0.2601,0.375711,0.887911,0.649807
400,0.2148,0.333038,0.893192,0.736059
450,0.1706,0.365533,0.894953,0.73292
500,0.1458,0.362827,0.892606,0.717293


faisalq/EgyBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.88,0.672155,0.808685,0.298075
100,0.5562,0.455994,0.869718,0.529325
150,0.4051,0.380221,0.867371,0.512531
200,0.376,0.351707,0.882042,0.551294
250,0.3066,0.354009,0.885563,0.549024
300,0.285,0.378109,0.872653,0.515274
350,0.2601,0.375711,0.887911,0.649807
400,0.2148,0.333038,0.893192,0.736059
450,0.1706,0.365533,0.894953,0.73292
500,0.1458,0.362827,0.892606,0.717293


faisalq/EgyBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/EgyBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.88,0.672155,0.808685,0.298075
100,0.5562,0.455994,0.869718,0.529325
150,0.4051,0.380221,0.867371,0.512531
200,0.376,0.351707,0.882042,0.551294
250,0.3066,0.354009,0.885563,0.549024
300,0.285,0.378109,0.872653,0.515274
350,0.2601,0.375711,0.887911,0.649807
400,0.2148,0.333038,0.893192,0.736059
450,0.1706,0.365533,0.894953,0.73292
500,0.1458,0.362827,0.892606,0.717293


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3827,0.328438,0.867371,0.692269
100,0.3021,0.311825,0.880282,0.661266
150,0.2012,0.353029,0.880869,0.722167
200,0.2015,0.344856,0.876174,0.677296
250,0.1118,0.493757,0.869131,0.718162
300,0.087,0.428568,0.884977,0.716334
350,0.0622,0.515876,0.882629,0.692981
400,0.029,0.625575,0.875,0.724263
450,0.0272,0.603178,0.875,0.711882
500,0.0169,0.621494,0.881455,0.727564


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3827,0.328438,0.867371,0.692269
100,0.3021,0.311825,0.880282,0.661266
150,0.2012,0.353029,0.880869,0.722167
200,0.2015,0.344856,0.876174,0.677296
250,0.1118,0.493757,0.869131,0.718162
300,0.087,0.428568,0.884977,0.716334
350,0.0622,0.515876,0.882629,0.692981
400,0.029,0.625575,0.875,0.724263
450,0.0272,0.603178,0.875,0.711882
500,0.0169,0.621494,0.881455,0.727564


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3827,0.328438,0.867371,0.692269
100,0.3021,0.311825,0.880282,0.661266
150,0.2012,0.353029,0.880869,0.722167
200,0.2015,0.344856,0.876174,0.677296
250,0.1118,0.493757,0.869131,0.718162
300,0.087,0.428568,0.884977,0.716334
350,0.0622,0.515876,0.882629,0.692981
400,0.029,0.625575,0.875,0.724263
450,0.0272,0.603178,0.875,0.711882
500,0.0169,0.621494,0.881455,0.727564


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.39,0.307945,0.879695,0.715055
100,0.2783,0.315232,0.889085,0.674527
150,0.2254,0.305542,0.884977,0.719513
200,0.1787,0.314741,0.889671,0.726
250,0.122,0.435636,0.888498,0.702117
300,0.1022,0.392199,0.893779,0.737604
350,0.0627,0.482718,0.878521,0.720753
400,0.0447,0.521281,0.892019,0.731974
450,0.0311,0.506159,0.900235,0.747883
500,0.0243,0.570948,0.896714,0.733282


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.39,0.307945,0.879695,0.715055
100,0.2783,0.315232,0.889085,0.674527
150,0.2254,0.305542,0.884977,0.719513
200,0.1787,0.314741,0.889671,0.726
250,0.122,0.435636,0.888498,0.702117
300,0.1022,0.392199,0.893779,0.737604
350,0.0627,0.482718,0.878521,0.720753
400,0.0447,0.521281,0.892019,0.731974
450,0.0311,0.506159,0.900235,0.747883
500,0.0243,0.570948,0.896714,0.733282


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.39,0.307945,0.879695,0.715055
100,0.2783,0.315232,0.889085,0.674527
150,0.2254,0.305542,0.884977,0.719513
200,0.1787,0.314741,0.889671,0.726
250,0.122,0.435636,0.888498,0.702117
300,0.1022,0.392199,0.893779,0.737604
350,0.0627,0.482718,0.878521,0.720753
400,0.0447,0.521281,0.892019,0.731974
450,0.0311,0.506159,0.900235,0.747883
500,0.0243,0.570948,0.896714,0.733282


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4029,0.298948,0.887324,0.725839
100,0.2843,0.301646,0.882629,0.738188
150,0.2138,0.286124,0.900822,0.754651
200,0.21,0.287267,0.900235,0.746493
250,0.1097,0.405341,0.901408,0.759349
300,0.0901,0.391175,0.890845,0.726949
350,0.0691,0.465747,0.886737,0.719234
400,0.0372,0.45953,0.890258,0.732349
450,0.0298,0.539348,0.896127,0.730044
500,0.0208,0.56258,0.893192,0.724591


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4029,0.298948,0.887324,0.725839
100,0.2843,0.301646,0.882629,0.738188
150,0.2138,0.286124,0.900822,0.754651
200,0.21,0.287267,0.900235,0.746493
250,0.1097,0.405341,0.901408,0.759349
300,0.0901,0.391175,0.890845,0.726949
350,0.0691,0.465747,0.886737,0.719234
400,0.0372,0.45953,0.890258,0.732349
450,0.0298,0.539348,0.896127,0.730044
500,0.0208,0.56258,0.893192,0.724591


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4029,0.298948,0.887324,0.725839
100,0.2843,0.301646,0.882629,0.738188
150,0.2138,0.286124,0.900822,0.754651
200,0.21,0.287267,0.900235,0.746493
250,0.1097,0.405341,0.901408,0.759349
300,0.0901,0.391175,0.890845,0.726949
350,0.0691,0.465747,0.886737,0.719234
400,0.0372,0.45953,0.890258,0.732349
450,0.0298,0.539348,0.896127,0.730044
500,0.0208,0.56258,0.893192,0.724591


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

tunis-ai/TunBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5798,0.448443,0.849765,0.517302
100,0.4296,0.414336,0.860915,0.531728
150,0.3857,0.394354,0.864437,0.534839
200,0.4102,0.398807,0.868545,0.532826
250,0.3721,0.377105,0.868545,0.529419
300,0.3406,0.402566,0.850939,0.549078
350,0.3691,0.363859,0.870305,0.628934
400,0.3485,0.367512,0.867958,0.542067
450,0.3087,0.369355,0.875,0.568069
500,0.3242,0.353012,0.872653,0.665578


tunis-ai/TunBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5798,0.448443,0.849765,0.517302
100,0.4296,0.414336,0.860915,0.531728
150,0.3857,0.394354,0.864437,0.534839
200,0.4102,0.398807,0.868545,0.532826
250,0.3721,0.377105,0.868545,0.529419
300,0.3406,0.402566,0.850939,0.549078
350,0.3691,0.363859,0.870305,0.628934
400,0.3485,0.367512,0.867958,0.542067
450,0.3087,0.369355,0.875,0.568069
500,0.3242,0.353012,0.872653,0.665578


tunis-ai/TunBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5798,0.448443,0.849765,0.517302
100,0.4296,0.414336,0.860915,0.531728
150,0.3857,0.394354,0.864437,0.534839
200,0.4102,0.398807,0.868545,0.532826
250,0.3721,0.377105,0.868545,0.529419
300,0.3406,0.402566,0.850939,0.549078
350,0.3691,0.363859,0.870305,0.628934
400,0.3485,0.367512,0.867958,0.542067
450,0.3087,0.369355,0.875,0.568069
500,0.3242,0.353012,0.872653,0.665578


tunis-ai/TunBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5443,0.420295,0.863263,0.530884
100,0.3975,0.500606,0.795775,0.500007
150,0.4235,0.439226,0.870305,0.537581
200,0.3824,0.443067,0.816901,0.400243
250,0.3797,0.399601,0.86385,0.526229
300,0.3635,0.467465,0.862676,0.54339
350,0.3676,0.38263,0.865023,0.604724
400,0.3521,0.374783,0.869131,0.545323
450,0.3056,0.398964,0.851526,0.581264
500,0.3297,0.353206,0.877934,0.626709


tunis-ai/TunBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5443,0.420295,0.863263,0.530884
100,0.3975,0.500606,0.795775,0.500007
150,0.4235,0.439226,0.870305,0.537581
200,0.3824,0.443067,0.816901,0.400243
250,0.3797,0.399601,0.86385,0.526229
300,0.3635,0.467465,0.862676,0.54339
350,0.3676,0.38263,0.865023,0.604724
400,0.3521,0.374783,0.869131,0.545323
450,0.3056,0.398964,0.851526,0.581264
500,0.3297,0.353206,0.877934,0.626709


tunis-ai/TunBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5443,0.420295,0.863263,0.530884
100,0.3975,0.500606,0.795775,0.500007
150,0.4235,0.439226,0.870305,0.537581
200,0.3824,0.443067,0.816901,0.400243
250,0.3797,0.399601,0.86385,0.526229
300,0.3635,0.467465,0.862676,0.54339
350,0.3676,0.38263,0.865023,0.604724
400,0.3521,0.374783,0.869131,0.545323
450,0.3056,0.398964,0.851526,0.581264
500,0.3297,0.353206,0.877934,0.626709


tunis-ai/TunBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5671,0.437086,0.85446,0.526122
100,0.4294,0.437963,0.834507,0.51154
150,0.4063,0.42158,0.83392,0.418469
200,0.4125,0.363573,0.873239,0.54072
250,0.371,0.39504,0.857394,0.497134
300,0.3577,0.364231,0.873239,0.536883
350,0.366,0.363264,0.861502,0.634207
400,0.3373,0.359598,0.875,0.561034
450,0.3386,0.3625,0.870305,0.574737
500,0.325,0.384364,0.85446,0.649586


tunis-ai/TunBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5671,0.437086,0.85446,0.526122
100,0.4294,0.437963,0.834507,0.51154
150,0.4063,0.42158,0.83392,0.418469
200,0.4125,0.363573,0.873239,0.54072
250,0.371,0.39504,0.857394,0.497134
300,0.3577,0.364231,0.873239,0.536883
350,0.366,0.363264,0.861502,0.634207
400,0.3373,0.359598,0.875,0.561034
450,0.3386,0.3625,0.870305,0.574737
500,0.325,0.384364,0.85446,0.649586


tunis-ai/TunBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at tunis-ai/TunBERT and are newly initialized: ['classifier.bias', 'classifier.weight', 'embeddings.LayerNorm.bias', 'embeddings.LayerNorm.weight', 'embeddings.position_embeddings.weight', 'embeddings.token_type_embeddings.weight', 'embeddings.word_embeddings.weight', 'encoder.layer.0.attention.output.LayerNorm.bias', 'encoder.layer.0.attention.output.LayerNorm.weight', 'encoder.layer.0.attention.output.dense.bias', 'encoder.layer.0.attention.output.dense.weight', 'encoder.layer.0.attention.self.key.bias', 'encoder.layer.0.attention.self.key.weight', 'encoder.layer.0.attention.self.query.bias', 'encoder.layer.0.attention.self.query.weight', 'encoder.layer.0.attention.self.value.bias', 'encoder.layer.0.attention.self.value.weight', 'encoder.layer.0.intermediate.dense.bias', 'encoder.layer.0.intermediate.dense.weight', 'encoder.layer.0.output.LayerNorm.bias', 'encoder.layer.0.output.LayerNorm.wei

Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.5671,0.437086,0.85446,0.526122
100,0.4294,0.437963,0.834507,0.51154
150,0.4063,0.42158,0.83392,0.418469
200,0.4125,0.363573,0.873239,0.54072
250,0.371,0.39504,0.857394,0.497134
300,0.3577,0.364231,0.873239,0.536883
350,0.366,0.363264,0.861502,0.634207
400,0.3373,0.359598,0.875,0.561034
450,0.3386,0.3625,0.870305,0.574737
500,0.325,0.384364,0.85446,0.649586


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

alger-ia/dziribert, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3812,0.306917,0.881455,0.688459
100,0.2934,0.298723,0.882629,0.713574
150,0.1786,0.356214,0.878521,0.712821
200,0.1856,0.322228,0.888498,0.691644
250,0.0976,0.428804,0.892606,0.73101
300,0.0446,0.547756,0.882042,0.693509
350,0.0463,0.516981,0.88439,0.706878
400,0.0228,0.549817,0.883216,0.735829
450,0.015,0.629247,0.894366,0.744415
500,0.01,0.615532,0.889085,0.747426


alger-ia/dziribert, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3812,0.306917,0.881455,0.688459
100,0.2934,0.298723,0.882629,0.713574
150,0.1786,0.356214,0.878521,0.712821
200,0.1856,0.322228,0.888498,0.691644
250,0.0976,0.428804,0.892606,0.73101
300,0.0446,0.547756,0.882042,0.693509
350,0.0463,0.516981,0.88439,0.706878
400,0.0228,0.549817,0.883216,0.735829
450,0.015,0.629247,0.894366,0.744415
500,0.01,0.615532,0.889085,0.747426


alger-ia/dziribert, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3812,0.306917,0.881455,0.688459
100,0.2934,0.298723,0.882629,0.713574
150,0.1786,0.356214,0.878521,0.712821
200,0.1856,0.322228,0.888498,0.691644
250,0.0976,0.428804,0.892606,0.73101
300,0.0446,0.547756,0.882042,0.693509
350,0.0463,0.516981,0.88439,0.706878
400,0.0228,0.549817,0.883216,0.735829
450,0.015,0.629247,0.894366,0.744415
500,0.01,0.615532,0.889085,0.747426


alger-ia/dziribert, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3958,0.302262,0.88439,0.706477
100,0.284,0.29848,0.890258,0.691339
150,0.1966,0.339563,0.88439,0.706094
200,0.1633,0.376311,0.879108,0.697689
250,0.1016,0.483033,0.881455,0.701527
300,0.0621,0.523173,0.879108,0.702102
350,0.0503,0.601313,0.883216,0.705336
400,0.0248,0.604293,0.880869,0.717343
450,0.0166,0.62025,0.883803,0.718007
500,0.017,0.695194,0.871479,0.700568


alger-ia/dziribert, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3958,0.302262,0.88439,0.706477
100,0.284,0.29848,0.890258,0.691339
150,0.1966,0.339563,0.88439,0.706094
200,0.1633,0.376311,0.879108,0.697689
250,0.1016,0.483033,0.881455,0.701527
300,0.0621,0.523173,0.879108,0.702102
350,0.0503,0.601313,0.883216,0.705336
400,0.0248,0.604293,0.880869,0.717343
450,0.0166,0.62025,0.883803,0.718007
500,0.017,0.695194,0.871479,0.700568


alger-ia/dziribert, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3958,0.302262,0.88439,0.706477
100,0.284,0.29848,0.890258,0.691339
150,0.1966,0.339563,0.88439,0.706094
200,0.1633,0.376311,0.879108,0.697689
250,0.1016,0.483033,0.881455,0.701527
300,0.0621,0.523173,0.879108,0.702102
350,0.0503,0.601313,0.883216,0.705336
400,0.0248,0.604293,0.880869,0.717343
450,0.0166,0.62025,0.883803,0.718007
500,0.017,0.695194,0.871479,0.700568


alger-ia/dziribert, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4046,0.298131,0.884977,0.709742
100,0.2803,0.279361,0.8973,0.718191
150,0.2013,0.305198,0.889085,0.711949
200,0.1796,0.310676,0.898474,0.746594
250,0.0848,0.473502,0.890258,0.729593
300,0.0675,0.440378,0.892019,0.725128
350,0.0499,0.556676,0.882629,0.72871
400,0.0317,0.544017,0.88615,0.718577
450,0.0156,0.612121,0.890258,0.727161
500,0.0126,0.658654,0.881455,0.728146


alger-ia/dziribert, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4046,0.298131,0.884977,0.709742
100,0.2803,0.279361,0.8973,0.718191
150,0.2013,0.305198,0.889085,0.711949
200,0.1796,0.310676,0.898474,0.746594
250,0.0848,0.473502,0.890258,0.729593
300,0.0675,0.440378,0.892019,0.725128
350,0.0499,0.556676,0.882629,0.72871
400,0.0317,0.544017,0.88615,0.718577
450,0.0156,0.612121,0.890258,0.727161
500,0.0126,0.658654,0.881455,0.728146


alger-ia/dziribert, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at alger-ia/dziribert and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4046,0.298131,0.884977,0.709742
100,0.2803,0.279361,0.8973,0.718191
150,0.2013,0.305198,0.889085,0.711949
200,0.1796,0.310676,0.898474,0.746594
250,0.0848,0.473502,0.890258,0.729593
300,0.0675,0.440378,0.892019,0.725128
350,0.0499,0.556676,0.882629,0.72871
400,0.0317,0.544017,0.88615,0.718577
450,0.0156,0.612121,0.890258,0.727161
500,0.0126,0.658654,0.881455,0.728146


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

SI2M-Lab/DarijaBERT, try:0


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3989,0.33181,0.873826,0.688338
100,0.3109,0.332829,0.876761,0.709931
150,0.2175,0.372362,0.878521,0.716345
200,0.2331,0.384803,0.88439,0.667998
250,0.1507,0.428496,0.877934,0.727472
300,0.1091,0.463164,0.885563,0.673612
350,0.0789,0.481249,0.887911,0.737731
400,0.0448,0.560135,0.875587,0.715835
450,0.0403,0.628042,0.876761,0.715229
500,0.0317,0.618908,0.882629,0.727385


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:1


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3989,0.33181,0.873826,0.688338
100,0.3109,0.332829,0.876761,0.709931
150,0.2175,0.372362,0.878521,0.716345
200,0.2331,0.384803,0.88439,0.667998
250,0.1507,0.428496,0.877934,0.727472
300,0.1091,0.463164,0.885563,0.673612
350,0.0789,0.481249,0.887911,0.737731
400,0.0448,0.560135,0.875587,0.715835
450,0.0403,0.628042,0.876761,0.715229
500,0.0317,0.618908,0.882629,0.727385


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:2


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3989,0.33181,0.873826,0.688338
100,0.3109,0.332829,0.876761,0.709931
150,0.2175,0.372362,0.878521,0.716345
200,0.2331,0.384803,0.88439,0.667998
250,0.1507,0.428496,0.877934,0.727472
300,0.1091,0.463164,0.885563,0.673612
350,0.0789,0.481249,0.887911,0.737731
400,0.0448,0.560135,0.875587,0.715835
450,0.0403,0.628042,0.876761,0.715229
500,0.0317,0.618908,0.882629,0.727385


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:0


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4071,0.323254,0.871479,0.701349
100,0.3123,0.324472,0.88615,0.644563
150,0.2646,0.356653,0.883216,0.701021
200,0.2117,0.359089,0.867371,0.666337
250,0.1489,0.413719,0.884977,0.700027
300,0.1188,0.410003,0.885563,0.723536
350,0.0791,0.496991,0.880282,0.723843
400,0.057,0.507634,0.892019,0.741583
450,0.0474,0.555412,0.891432,0.740012
500,0.0409,0.562397,0.888498,0.723551


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:1


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4071,0.323254,0.871479,0.701349
100,0.3123,0.324472,0.88615,0.644563
150,0.2646,0.356653,0.883216,0.701021
200,0.2117,0.359089,0.867371,0.666337
250,0.1489,0.413719,0.884977,0.700027
300,0.1188,0.410003,0.885563,0.723536
350,0.0791,0.496991,0.880282,0.723843
400,0.057,0.507634,0.892019,0.741583
450,0.0474,0.555412,0.891432,0.740012
500,0.0409,0.562397,0.888498,0.723551


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:2


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4071,0.323254,0.871479,0.701349
100,0.3123,0.324472,0.88615,0.644563
150,0.2646,0.356653,0.883216,0.701021
200,0.2117,0.359089,0.867371,0.666337
250,0.1489,0.413719,0.884977,0.700027
300,0.1188,0.410003,0.885563,0.723536
350,0.0791,0.496991,0.880282,0.723843
400,0.057,0.507634,0.892019,0.741583
450,0.0474,0.555412,0.891432,0.740012
500,0.0409,0.562397,0.888498,0.723551


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:0


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.417,0.336257,0.867958,0.69342
100,0.3061,0.310603,0.887911,0.740502
150,0.2383,0.305464,0.892019,0.709977
200,0.2249,0.300306,0.905516,0.760702
250,0.1401,0.45267,0.885563,0.712212
300,0.1222,0.369384,0.897887,0.725037
350,0.083,0.636626,0.859155,0.68037
400,0.0488,0.480514,0.900822,0.735498
450,0.0397,0.500639,0.897887,0.728991
500,0.034,0.565574,0.88615,0.723148


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:1


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.417,0.336257,0.867958,0.69342
100,0.3061,0.310603,0.887911,0.740502
150,0.2383,0.305464,0.892019,0.709977
200,0.2249,0.300306,0.905516,0.760702
250,0.1401,0.45267,0.885563,0.712212
300,0.1222,0.369384,0.897887,0.725037
350,0.083,0.636626,0.859155,0.68037
400,0.0488,0.480514,0.900822,0.735498
450,0.0397,0.500639,0.897887,0.728991
500,0.034,0.565574,0.88615,0.723148


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.


SI2M-Lab/DarijaBERT, try:2


The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
The `xla_device` argument has been deprecated in v4.4.0 of Transformers. It is ignored and you can safely remove it from your `config.json` file.
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.417,0.336257,0.867958,0.69342
100,0.3061,0.310603,0.887911,0.740502
150,0.2383,0.305464,0.892019,0.709977
200,0.2249,0.300306,0.905516,0.760702
250,0.1401,0.45267,0.885563,0.712212
300,0.1222,0.369384,0.897887,0.725037
350,0.083,0.636626,0.859155,0.68037
400,0.0488,0.480514,0.900822,0.735498
450,0.0397,0.500639,0.897887,0.728991
500,0.034,0.565574,0.88615,0.723148


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

otmangi/MorRoBERTa, try:0


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3994,0.32573,0.880869,0.696009
100,0.3064,0.308644,0.88439,0.734313
150,0.2091,0.369309,0.876761,0.705504
200,0.2245,0.342283,0.889085,0.680744
250,0.1381,0.439343,0.882629,0.7061
300,0.091,0.4227,0.890845,0.727363
350,0.0635,0.520461,0.88615,0.69145
400,0.0327,0.597873,0.872653,0.717921
450,0.0297,0.59705,0.883803,0.721898
500,0.0156,0.674212,0.871479,0.699928


otmangi/MorRoBERTa, try:1


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3994,0.32573,0.880869,0.696009
100,0.3064,0.308644,0.88439,0.734313
150,0.2091,0.369309,0.876761,0.705504
200,0.2245,0.342283,0.889085,0.680744
250,0.1381,0.439343,0.882629,0.7061
300,0.091,0.4227,0.890845,0.727363
350,0.0635,0.520461,0.88615,0.69145
400,0.0327,0.597873,0.872653,0.717921
450,0.0297,0.59705,0.883803,0.721898
500,0.0156,0.674212,0.871479,0.699928


otmangi/MorRoBERTa, try:2


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3994,0.32573,0.880869,0.696009
100,0.3064,0.308644,0.88439,0.734313
150,0.2091,0.369309,0.876761,0.705504
200,0.2245,0.342283,0.889085,0.680744
250,0.1381,0.439343,0.882629,0.7061
300,0.091,0.4227,0.890845,0.727363
350,0.0635,0.520461,0.88615,0.69145
400,0.0327,0.597873,0.872653,0.717921
450,0.0297,0.59705,0.883803,0.721898
500,0.0156,0.674212,0.871479,0.699928


otmangi/MorRoBERTa, try:0


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4091,0.316939,0.874413,0.697284
100,0.2967,0.302311,0.877934,0.691758
150,0.2348,0.318162,0.886737,0.71601
200,0.1915,0.374254,0.880869,0.71798
250,0.1292,0.456359,0.880869,0.71962
300,0.1093,0.399119,0.884977,0.734061
350,0.0678,0.531326,0.879695,0.723305
400,0.0462,0.543401,0.880869,0.717747
450,0.04,0.529996,0.880282,0.73147
500,0.0296,0.6217,0.880869,0.705671


otmangi/MorRoBERTa, try:1


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4091,0.316939,0.874413,0.697284
100,0.2967,0.302311,0.877934,0.691758
150,0.2348,0.318162,0.886737,0.71601
200,0.1915,0.374254,0.880869,0.71798
250,0.1292,0.456359,0.880869,0.71962
300,0.1093,0.399119,0.884977,0.734061
350,0.0678,0.531326,0.879695,0.723305
400,0.0462,0.543401,0.880869,0.717747
450,0.04,0.529996,0.880282,0.73147
500,0.0296,0.6217,0.880869,0.705671


otmangi/MorRoBERTa, try:2


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4091,0.316939,0.874413,0.697284
100,0.2967,0.302311,0.877934,0.691758
150,0.2348,0.318162,0.886737,0.71601
200,0.1915,0.374254,0.880869,0.71798
250,0.1292,0.456359,0.880869,0.71962
300,0.1093,0.399119,0.884977,0.734061
350,0.0678,0.531326,0.879695,0.723305
400,0.0462,0.543401,0.880869,0.717747
450,0.04,0.529996,0.880282,0.73147
500,0.0296,0.6217,0.880869,0.705671


otmangi/MorRoBERTa, try:0


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4211,0.316038,0.875,0.684096
100,0.2881,0.296718,0.893192,0.721491
150,0.2221,0.312444,0.889671,0.723054
200,0.2001,0.321918,0.892606,0.735544
250,0.1279,0.432919,0.884977,0.735379
300,0.1069,0.451701,0.883803,0.698837
350,0.0801,0.533335,0.881455,0.728885
400,0.0445,0.573404,0.889085,0.730237
450,0.0311,0.662542,0.869131,0.690255
500,0.0316,0.622062,0.884977,0.741106


otmangi/MorRoBERTa, try:1


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4211,0.316038,0.875,0.684096
100,0.2881,0.296718,0.893192,0.721491
150,0.2221,0.312444,0.889671,0.723054
200,0.2001,0.321918,0.892606,0.735544
250,0.1279,0.432919,0.884977,0.735379
300,0.1069,0.451701,0.883803,0.698837
350,0.0801,0.533335,0.881455,0.728885
400,0.0445,0.573404,0.889085,0.730237
450,0.0311,0.662542,0.869131,0.690255
500,0.0316,0.622062,0.884977,0.741106


otmangi/MorRoBERTa, try:2


Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at otmangi/MorRoBERTa and are newly initialized: ['classifier.dense.bias', 'classifier.dense.weight', 'classifier.out_proj.bias', 'classifier.out_proj.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4211,0.316038,0.875,0.684096
100,0.2881,0.296718,0.893192,0.721491
150,0.2221,0.312444,0.889671,0.723054
200,0.2001,0.321918,0.892606,0.735544
250,0.1279,0.432919,0.884977,0.735379
300,0.1069,0.451701,0.883803,0.698837
350,0.0801,0.533335,0.881455,0.728885
400,0.0445,0.573404,0.889085,0.730237
450,0.0311,0.662542,0.869131,0.690255
500,0.0316,0.622062,0.884977,0.741106


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

otmangi/MorrBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3751,0.313671,0.883216,0.708885
100,0.3004,0.312895,0.875,0.694216
150,0.2052,0.347163,0.88615,0.717868
200,0.2068,0.348047,0.885563,0.687802
250,0.1241,0.412404,0.880869,0.703491
300,0.0667,0.454959,0.885563,0.711309
350,0.0654,0.536963,0.884977,0.704408
400,0.0433,0.535829,0.880282,0.69789
450,0.0187,0.621454,0.882629,0.705214
500,0.0194,0.64646,0.88439,0.705493


otmangi/MorrBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3751,0.313671,0.883216,0.708885
100,0.3004,0.312895,0.875,0.694216
150,0.2052,0.347163,0.88615,0.717868
200,0.2068,0.348047,0.885563,0.687802
250,0.1241,0.412404,0.880869,0.703491
300,0.0667,0.454959,0.885563,0.711309
350,0.0654,0.536963,0.884977,0.704408
400,0.0433,0.535829,0.880282,0.69789
450,0.0187,0.621454,0.882629,0.705214
500,0.0194,0.64646,0.88439,0.705493


otmangi/MorrBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3751,0.313671,0.883216,0.708885
100,0.3004,0.312895,0.875,0.694216
150,0.2052,0.347163,0.88615,0.717868
200,0.2068,0.348047,0.885563,0.687802
250,0.1241,0.412404,0.880869,0.703491
300,0.0667,0.454959,0.885563,0.711309
350,0.0654,0.536963,0.884977,0.704408
400,0.0433,0.535829,0.880282,0.69789
450,0.0187,0.621454,0.882629,0.705214
500,0.0194,0.64646,0.88439,0.705493


otmangi/MorrBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.389,0.31341,0.883216,0.700499
100,0.2982,0.293738,0.889671,0.706551
150,0.2332,0.31339,0.887911,0.698033
200,0.1888,0.344724,0.881455,0.693932
250,0.1305,0.551678,0.870305,0.626156
300,0.1006,0.440868,0.876174,0.688218
350,0.0587,0.556709,0.879695,0.700947
400,0.0427,0.608421,0.873239,0.688855
450,0.0257,0.629472,0.880869,0.697694
500,0.0226,0.738301,0.877347,0.692228


otmangi/MorrBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.389,0.31341,0.883216,0.700499
100,0.2982,0.293738,0.889671,0.706551
150,0.2332,0.31339,0.887911,0.698033
200,0.1888,0.344724,0.881455,0.693932
250,0.1305,0.551678,0.870305,0.626156
300,0.1006,0.440868,0.876174,0.688218
350,0.0587,0.556709,0.879695,0.700947
400,0.0427,0.608421,0.873239,0.688855
450,0.0257,0.629472,0.880869,0.697694
500,0.0226,0.738301,0.877347,0.692228


otmangi/MorrBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.389,0.31341,0.883216,0.700499
100,0.2982,0.293738,0.889671,0.706551
150,0.2332,0.31339,0.887911,0.698033
200,0.1888,0.344724,0.881455,0.693932
250,0.1305,0.551678,0.870305,0.626156
300,0.1006,0.440868,0.876174,0.688218
350,0.0587,0.556709,0.879695,0.700947
400,0.0427,0.608421,0.873239,0.688855
450,0.0257,0.629472,0.880869,0.697694
500,0.0226,0.738301,0.877347,0.692228


otmangi/MorrBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3987,0.310427,0.880869,0.675646
100,0.2975,0.298319,0.896127,0.709025
150,0.2247,0.319014,0.875,0.697351
200,0.208,0.297875,0.894366,0.72429
250,0.1079,0.40776,0.889671,0.734273
300,0.0869,0.41533,0.88615,0.691722
350,0.0736,0.485916,0.879108,0.69109
400,0.0429,0.582877,0.88439,0.707364
450,0.0402,0.549538,0.890258,0.724016
500,0.0288,0.572886,0.88615,0.712613


otmangi/MorrBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3987,0.310427,0.880869,0.675646
100,0.2975,0.298319,0.896127,0.709025
150,0.2247,0.319014,0.875,0.697351
200,0.208,0.297875,0.894366,0.72429
250,0.1079,0.40776,0.889671,0.734273
300,0.0869,0.41533,0.88615,0.691722
350,0.0736,0.485916,0.879108,0.69109
400,0.0429,0.582877,0.88439,0.707364
450,0.0402,0.549538,0.890258,0.724016
500,0.0288,0.572886,0.88615,0.712613


otmangi/MorrBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at otmangi/MorrBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3987,0.310427,0.880869,0.675646
100,0.2975,0.298319,0.896127,0.709025
150,0.2247,0.319014,0.875,0.697351
200,0.208,0.297875,0.894366,0.72429
250,0.1079,0.40776,0.889671,0.734273
300,0.0869,0.41533,0.88615,0.691722
350,0.0736,0.485916,0.879108,0.69109
400,0.0429,0.582877,0.88439,0.707364
450,0.0402,0.549538,0.890258,0.724016
500,0.0288,0.572886,0.88615,0.712613


Unnamed: 0,Model,Accuracy,F1
0,SI2M-Lab/DarijaBERT,0.896127,0.762304
3,alger-ia/dziribert,0.889085,0.747426
6,faisalq/EgyBERT,0.893192,0.736059
9,faisalq/SaudiBERT,0.901408,0.759349
12,otmangi/MorRoBERTa,0.886737,0.744082
15,otmangi/MorrBERT,0.889671,0.734273
18,tunis-ai/TunBERT,0.879108,0.682487
