In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'MAC_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/MAC corpus.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3


      
display(df.columns)
display(df[:4])

df['tweets'] = df['tweets'].astype('str')

classes = set(df['type'].values)
display(classes)

c = df['type'].value_counts()
display(c)

df['type'] = df['type'].astype('category')
df['label'] = df['type'].cat.codes

df = df[['tweets', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


# ds = Dataset.from_pandas(df)
# ds = ds.train_test_split(test_size=0.2)

# display(ds)

max_sequence_length = 128


models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]





seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['tweets'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True) # , batched=True
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)  # , batched=True
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 10
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 80, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 80
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-17 18:35:28.163300: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-17 18:35:28.187619: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['tweets', 'type', 'class'], dtype='object')

Unnamed: 0,tweets,type,class
0,ماهي آرائكم متتبعي الكرام,neutral,standard
1,عبقرية المدرب وروعة اللاعبين,positive,standard
2,أمة عربية واحدة خالدة,positive,standard
3,عاد إليكم من جديد وأخيرا درت جيم لهاد الصفحة,neutral,dialectal


{'mixed', 'negative', 'neutral', 'positive'}

type
positive    9897
neutral     4039
negative    3508
mixed        643
Name: count, dtype: int64

4

18087

DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6465,0.536313,0.796573,0.583601
160,0.4722,0.399063,0.858209,0.689441
240,0.3759,0.39509,0.876451,0.77288
320,0.2555,0.400439,0.880321,0.791386
400,0.2496,0.348608,0.885849,0.785403
480,0.1961,0.395206,0.891376,0.805827
560,0.1185,0.3986,0.889718,0.813182
640,0.1317,0.444532,0.889994,0.808587
720,0.1222,0.435082,0.899116,0.822343
800,0.0926,0.398371,0.901603,0.830156


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6634,0.520379,0.797402,0.58615
160,0.4683,0.399973,0.859867,0.70977
240,0.3752,0.384216,0.88115,0.791982
320,0.2484,0.392003,0.880044,0.77989
400,0.2467,0.336127,0.892482,0.806098
480,0.1921,0.387547,0.889442,0.81467
560,0.1117,0.386705,0.896904,0.821985
640,0.1312,0.432509,0.896075,0.826097
720,0.0973,0.419002,0.903261,0.823845
800,0.0837,0.392594,0.902432,0.833743


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6634,0.520379,0.797402,0.58615
160,0.4683,0.399973,0.859867,0.70977
240,0.3752,0.384216,0.88115,0.791982
320,0.2484,0.392003,0.880044,0.77989
400,0.2467,0.336127,0.892482,0.806098
480,0.1921,0.387547,0.889442,0.81467
560,0.1117,0.386705,0.896904,0.821985
640,0.1312,0.432509,0.896075,0.826097
720,0.0973,0.419002,0.903261,0.823845
800,0.0837,0.392594,0.902432,0.833743


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6712,0.478331,0.825871,0.621728
160,0.4364,0.411367,0.851023,0.726869
240,0.3734,0.408364,0.867606,0.770356
320,0.2235,0.407113,0.872305,0.775153
400,0.2451,0.384374,0.877004,0.7841
480,0.1722,0.409952,0.884467,0.794479
560,0.1237,0.431949,0.890271,0.79571
640,0.1194,0.458705,0.885572,0.794302
720,0.0924,0.544694,0.881426,0.787726
800,0.0712,0.478208,0.892482,0.819106


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6712,0.478331,0.825871,0.621728
160,0.4364,0.411367,0.851023,0.726869
240,0.3734,0.408364,0.867606,0.770356
320,0.2235,0.407113,0.872305,0.775153
400,0.2451,0.384374,0.877004,0.7841
480,0.1722,0.409952,0.884467,0.794479
560,0.1237,0.431949,0.890271,0.79571
640,0.1194,0.458705,0.885572,0.794302
720,0.0924,0.544694,0.881426,0.787726
800,0.0712,0.478208,0.892482,0.819106


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6712,0.478331,0.825871,0.621728
160,0.4364,0.411367,0.851023,0.726869
240,0.3734,0.408364,0.867606,0.770356
320,0.2235,0.407113,0.872305,0.775153
400,0.2451,0.384374,0.877004,0.7841
480,0.1722,0.409952,0.884467,0.794479
560,0.1237,0.431949,0.890271,0.79571
640,0.1194,0.458705,0.885572,0.794302
720,0.0924,0.544694,0.881426,0.787726
800,0.0712,0.478208,0.892482,0.819106


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6471,0.538881,0.805694,0.571454
160,0.4675,0.407706,0.849641,0.720808
240,0.3724,0.391284,0.86429,0.76431
320,0.2517,0.382877,0.875345,0.776698
400,0.2286,0.372858,0.887783,0.799801
480,0.1867,0.38935,0.889442,0.808638
560,0.118,0.408831,0.893588,0.814223
640,0.127,0.412591,0.888889,0.809149
720,0.1058,0.443588,0.893864,0.823592
800,0.0777,0.464227,0.894693,0.825875


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6471,0.538881,0.805694,0.571454
160,0.4675,0.407706,0.849641,0.720808
240,0.3724,0.391284,0.86429,0.76431
320,0.2517,0.382877,0.875345,0.776698
400,0.2286,0.372858,0.887783,0.799801
480,0.1867,0.38935,0.889442,0.808638
560,0.118,0.408831,0.893588,0.814223
640,0.127,0.412591,0.888889,0.809149
720,0.1058,0.443588,0.893864,0.823592
800,0.0777,0.464227,0.894693,0.825875


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6471,0.538881,0.805694,0.571454
160,0.4675,0.407706,0.849641,0.720808
240,0.3724,0.391284,0.86429,0.76431
320,0.2517,0.382877,0.875345,0.776698
400,0.2286,0.372858,0.887783,0.799801
480,0.1867,0.38935,0.889442,0.808638
560,0.118,0.408831,0.893588,0.814223
640,0.127,0.412591,0.888889,0.809149
720,0.1058,0.443588,0.893864,0.823592
800,0.0777,0.464227,0.894693,0.825875


DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7157,0.567618,0.796849,0.579471
160,0.5413,0.448734,0.834163,0.614591
240,0.436,0.411051,0.852957,0.744784
320,0.2664,0.430105,0.860697,0.759052
400,0.2633,0.397061,0.862078,0.762993
480,0.2026,0.488788,0.878386,0.780046
560,0.1201,0.439546,0.876175,0.793355
640,0.1177,0.470941,0.876451,0.79134
720,0.1043,0.492643,0.887231,0.79514
800,0.0773,0.521842,0.885019,0.797623


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7157,0.567618,0.796849,0.579471
160,0.5413,0.448734,0.834163,0.614591
240,0.436,0.411051,0.852957,0.744784
320,0.2664,0.430105,0.860697,0.759052
400,0.2633,0.397061,0.862078,0.762993
480,0.2026,0.488788,0.878386,0.780046
560,0.1201,0.439546,0.876175,0.793355
640,0.1177,0.470941,0.876451,0.79134
720,0.1043,0.492643,0.887231,0.79514
800,0.0773,0.521842,0.885019,0.797623


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7157,0.567618,0.796849,0.579471
160,0.5413,0.448734,0.834163,0.614591
240,0.436,0.411051,0.852957,0.744784
320,0.2664,0.430105,0.860697,0.759052
400,0.2633,0.397061,0.862078,0.762993
480,0.2026,0.488788,0.878386,0.780046
560,0.1201,0.439546,0.876175,0.793355
640,0.1177,0.470941,0.876451,0.79134
720,0.1043,0.492643,0.887231,0.79514
800,0.0773,0.521842,0.885019,0.797623


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7349,0.55763,0.791874,0.603966
160,0.5307,0.469687,0.828635,0.690235
240,0.4427,0.467692,0.847153,0.728365
320,0.2432,0.463051,0.85738,0.740271
400,0.2703,0.409843,0.869265,0.756849
480,0.1745,0.500566,0.8712,0.777033
560,0.1162,0.500123,0.872029,0.772689
640,0.1139,0.526713,0.868436,0.770864
720,0.1017,0.541458,0.881979,0.797615
800,0.0818,0.528993,0.877557,0.78896


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7349,0.55763,0.791874,0.603966
160,0.5307,0.469687,0.828635,0.690235
240,0.4427,0.467692,0.847153,0.728365
320,0.2432,0.463051,0.85738,0.740271
400,0.2703,0.409843,0.869265,0.756849
480,0.1745,0.500566,0.8712,0.777033
560,0.1162,0.500123,0.872029,0.772689
640,0.1139,0.526713,0.868436,0.770864
720,0.1017,0.541458,0.881979,0.797615
800,0.0818,0.528993,0.877557,0.78896


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7349,0.55763,0.791874,0.603966
160,0.5307,0.469687,0.828635,0.690235
240,0.4427,0.467692,0.847153,0.728365
320,0.2432,0.463051,0.85738,0.740271
400,0.2703,0.409843,0.869265,0.756849
480,0.1745,0.500566,0.8712,0.777033
560,0.1162,0.500123,0.872029,0.772689
640,0.1139,0.526713,0.868436,0.770864
720,0.1017,0.541458,0.881979,0.797615
800,0.0818,0.528993,0.877557,0.78896


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.707,0.601141,0.776949,0.580439
160,0.5589,0.465545,0.830293,0.698137
240,0.441,0.439351,0.8466,0.72002
320,0.2609,0.43376,0.858762,0.756783
400,0.2491,0.428542,0.861802,0.764795
480,0.1973,0.471245,0.86429,0.758816
560,0.1189,0.450253,0.873687,0.781236
640,0.1142,0.472951,0.875898,0.79893
720,0.0904,0.552607,0.87728,0.795259
800,0.0727,0.539236,0.885296,0.80801


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.707,0.601141,0.776949,0.580439
160,0.5589,0.465545,0.830293,0.698137
240,0.441,0.439351,0.8466,0.72002
320,0.2609,0.43376,0.858762,0.756783
400,0.2491,0.428542,0.861802,0.764795
480,0.1973,0.471245,0.86429,0.758816
560,0.1189,0.450253,0.873687,0.781236
640,0.1142,0.472951,0.875898,0.79893
720,0.0904,0.552607,0.87728,0.795259
800,0.0727,0.539236,0.885296,0.80801


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.707,0.601141,0.776949,0.580439
160,0.5589,0.465545,0.830293,0.698137
240,0.441,0.439351,0.8466,0.72002
320,0.2609,0.43376,0.858762,0.756783
400,0.2491,0.428542,0.861802,0.764795
480,0.1973,0.471245,0.86429,0.758816
560,0.1189,0.450253,0.873687,0.781236
640,0.1142,0.472951,0.875898,0.79893
720,0.0904,0.552607,0.87728,0.795259
800,0.0727,0.539236,0.885296,0.80801


DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6527,0.492784,0.815091,0.599039
160,0.4708,0.3988,0.859867,0.710127
240,0.3814,0.387712,0.879215,0.785443
320,0.2354,0.391591,0.873687,0.76969
400,0.223,0.344537,0.888336,0.802129
480,0.1695,0.439825,0.888889,0.798064
560,0.1093,0.451046,0.885849,0.807889
640,0.122,0.428872,0.893311,0.82471
720,0.1007,0.446701,0.898839,0.831691
800,0.0696,0.459458,0.896075,0.826869


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6527,0.492784,0.815091,0.599039
160,0.4708,0.3988,0.859867,0.710127
240,0.3814,0.387712,0.879215,0.785443
320,0.2354,0.391591,0.873687,0.76969
400,0.223,0.344537,0.888336,0.802129
480,0.1695,0.439825,0.888889,0.798064
560,0.1093,0.451046,0.885849,0.807889
640,0.122,0.428872,0.893311,0.82471
720,0.1007,0.446701,0.898839,0.831691
800,0.0696,0.459458,0.896075,0.826869


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6527,0.492784,0.815091,0.599039
160,0.4708,0.3988,0.859867,0.710127
240,0.3814,0.387712,0.879215,0.785443
320,0.2354,0.391591,0.873687,0.76969
400,0.223,0.344537,0.888336,0.802129
480,0.1695,0.439825,0.888889,0.798064
560,0.1093,0.451046,0.885849,0.807889
640,0.122,0.428872,0.893311,0.82471
720,0.1007,0.446701,0.898839,0.831691
800,0.0696,0.459458,0.896075,0.826869


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6491,0.494635,0.822001,0.652327
160,0.4616,0.420154,0.85047,0.722178
240,0.387,0.426404,0.86429,0.760001
320,0.2127,0.441687,0.87424,0.762611
400,0.2329,0.403239,0.876727,0.769707
480,0.1554,0.485317,0.880321,0.789248
560,0.1203,0.437769,0.880597,0.790762
640,0.1087,0.474365,0.881979,0.788221
720,0.0859,0.543037,0.880597,0.79073
800,0.0674,0.513804,0.891376,0.815241


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6491,0.494635,0.822001,0.652327
160,0.4616,0.420154,0.85047,0.722178
240,0.387,0.426404,0.86429,0.760001
320,0.2127,0.441687,0.87424,0.762611
400,0.2329,0.403239,0.876727,0.769707
480,0.1554,0.485317,0.880321,0.789248
560,0.1203,0.437769,0.880597,0.790762
640,0.1087,0.474365,0.881979,0.788221
720,0.0859,0.543037,0.880597,0.79073
800,0.0674,0.513804,0.891376,0.815241


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6491,0.494635,0.822001,0.652327
160,0.4616,0.420154,0.85047,0.722178
240,0.387,0.426404,0.86429,0.760001
320,0.2127,0.441687,0.87424,0.762611
400,0.2329,0.403239,0.876727,0.769707
480,0.1554,0.485317,0.880321,0.789248
560,0.1203,0.437769,0.880597,0.790762
640,0.1087,0.474365,0.881979,0.788221
720,0.0859,0.543037,0.880597,0.79073
800,0.0674,0.513804,0.891376,0.815241


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6158,0.492073,0.822278,0.632281
160,0.4866,0.410484,0.852957,0.7227
240,0.3845,0.380692,0.868159,0.781474
320,0.2368,0.375736,0.871476,0.776193
400,0.2086,0.404958,0.87728,0.787234
480,0.164,0.46164,0.88115,0.797335
560,0.1157,0.454842,0.876451,0.794089
640,0.112,0.453939,0.891376,0.821888
720,0.0825,0.490842,0.894417,0.830744
800,0.067,0.563231,0.882808,0.794811


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6158,0.492073,0.822278,0.632281
160,0.4866,0.410484,0.852957,0.7227
240,0.3845,0.380692,0.868159,0.781474
320,0.2368,0.375736,0.871476,0.776193
400,0.2086,0.404958,0.87728,0.787234
480,0.164,0.46164,0.88115,0.797335
560,0.1157,0.454842,0.876451,0.794089
640,0.112,0.453939,0.891376,0.821888
720,0.0825,0.490842,0.894417,0.830744
800,0.067,0.563231,0.882808,0.794811


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6158,0.492073,0.822278,0.632281
160,0.4866,0.410484,0.852957,0.7227
240,0.3845,0.380692,0.868159,0.781474
320,0.2368,0.375736,0.871476,0.776193
400,0.2086,0.404958,0.87728,0.787234
480,0.164,0.46164,0.88115,0.797335
560,0.1157,0.454842,0.876451,0.794089
640,0.112,0.453939,0.891376,0.821888
720,0.0825,0.490842,0.894417,0.830744
800,0.067,0.563231,0.882808,0.794811


DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7211,0.515326,0.80597,0.593751
160,0.5038,0.449337,0.845771,0.669218
240,0.4061,0.447761,0.859867,0.752562
320,0.2694,0.412056,0.865948,0.746937
400,0.2577,0.365655,0.878662,0.792066
480,0.1954,0.467479,0.883361,0.791595
560,0.127,0.443373,0.883637,0.812523
640,0.1278,0.476101,0.885572,0.80939
720,0.1041,0.554307,0.883914,0.786554
800,0.0871,0.489822,0.895246,0.826075


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7211,0.515326,0.80597,0.593751
160,0.5038,0.449337,0.845771,0.669218
240,0.4061,0.447761,0.859867,0.752562
320,0.2694,0.412056,0.865948,0.746937
400,0.2577,0.365655,0.878662,0.792066
480,0.1954,0.467479,0.883361,0.791595
560,0.127,0.443373,0.883637,0.812523
640,0.1278,0.476101,0.885572,0.80939
720,0.1041,0.554307,0.883914,0.786554
800,0.0871,0.489822,0.895246,0.826075


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7211,0.515326,0.80597,0.593751
160,0.5038,0.449337,0.845771,0.669218
240,0.4061,0.447761,0.859867,0.752562
320,0.2694,0.412056,0.865948,0.746937
400,0.2577,0.365655,0.878662,0.792066
480,0.1954,0.467479,0.883361,0.791595
560,0.127,0.443373,0.883637,0.812523
640,0.1278,0.476101,0.885572,0.80939
720,0.1041,0.554307,0.883914,0.786554
800,0.0871,0.489822,0.895246,0.826075


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6874,0.519274,0.813433,0.591704
160,0.4922,0.43608,0.844666,0.700842
240,0.4073,0.462428,0.849088,0.740611
320,0.2472,0.42784,0.866224,0.751811
400,0.2603,0.454864,0.862908,0.733898
480,0.195,0.551602,0.862355,0.756841
560,0.1284,0.481817,0.878109,0.786419
640,0.129,0.482414,0.881426,0.789344
720,0.0988,0.563244,0.873134,0.771974
800,0.0814,0.52195,0.887783,0.804315


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6874,0.519274,0.813433,0.591704
160,0.4922,0.43608,0.844666,0.700842
240,0.4073,0.462428,0.849088,0.740611
320,0.2472,0.42784,0.866224,0.751811
400,0.2603,0.454864,0.862908,0.733898
480,0.195,0.551602,0.862355,0.756841
560,0.1284,0.481817,0.878109,0.786419
640,0.129,0.482414,0.881426,0.789344
720,0.0988,0.563244,0.873134,0.771974
800,0.0814,0.52195,0.887783,0.804315


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6874,0.519274,0.813433,0.591704
160,0.4922,0.43608,0.844666,0.700842
240,0.4073,0.462428,0.849088,0.740611
320,0.2472,0.42784,0.866224,0.751811
400,0.2603,0.454864,0.862908,0.733898
480,0.195,0.551602,0.862355,0.756841
560,0.1284,0.481817,0.878109,0.786419
640,0.129,0.482414,0.881426,0.789344
720,0.0988,0.563244,0.873134,0.771974
800,0.0814,0.52195,0.887783,0.804315


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6793,0.536795,0.804035,0.590804
160,0.5316,0.431755,0.845218,0.708197
240,0.4051,0.422051,0.860973,0.755015
320,0.2621,0.394608,0.873411,0.776078
400,0.2407,0.381607,0.878939,0.800375
480,0.1943,0.451047,0.872305,0.795796
560,0.135,0.457282,0.874793,0.782882
640,0.1218,0.442062,0.88419,0.801206
720,0.0938,0.530295,0.884467,0.811231
800,0.0868,0.54959,0.889442,0.80831


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6793,0.536795,0.804035,0.590804
160,0.5316,0.431755,0.845218,0.708197
240,0.4051,0.422051,0.860973,0.755015
320,0.2621,0.394608,0.873411,0.776078
400,0.2407,0.381607,0.878939,0.800375
480,0.1943,0.451047,0.872305,0.795796
560,0.135,0.457282,0.874793,0.782882
640,0.1218,0.442062,0.88419,0.801206
720,0.0938,0.530295,0.884467,0.811231
800,0.0868,0.54959,0.889442,0.80831


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.6793,0.536795,0.804035,0.590804
160,0.5316,0.431755,0.845218,0.708197
240,0.4051,0.422051,0.860973,0.755015
320,0.2621,0.394608,0.873411,0.776078
400,0.2407,0.381607,0.878939,0.800375
480,0.1943,0.451047,0.872305,0.795796
560,0.135,0.457282,0.874793,0.782882
640,0.1218,0.442062,0.88419,0.801206
720,0.0938,0.530295,0.884467,0.811231
800,0.0868,0.54959,0.889442,0.80831


DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.873,0.560994,0.79298,0.580414
160,0.5396,0.438242,0.844389,0.673043
240,0.4148,0.418779,0.866777,0.764717
320,0.3145,0.411444,0.867054,0.776833
400,0.2843,0.336111,0.886401,0.809115
480,0.216,0.418376,0.889165,0.805909
560,0.14,0.386282,0.8911,0.817958
640,0.1422,0.377237,0.898839,0.81717
720,0.1246,0.46768,0.898286,0.818467
800,0.0966,0.431102,0.902156,0.829135


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.873,0.560994,0.79298,0.580414
160,0.5396,0.438242,0.844389,0.673043
240,0.4148,0.418779,0.866777,0.764717
320,0.3145,0.411444,0.867054,0.776833
400,0.2843,0.336111,0.886401,0.809115
480,0.216,0.418376,0.889165,0.805909
560,0.14,0.386282,0.8911,0.817958
640,0.1422,0.377237,0.898839,0.81717
720,0.1246,0.46768,0.898286,0.818467
800,0.0966,0.431102,0.902156,0.829135


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.873,0.560994,0.79298,0.580414
160,0.5396,0.438242,0.844389,0.673043
240,0.4148,0.418779,0.866777,0.764717
320,0.3145,0.411444,0.867054,0.776833
400,0.2843,0.336111,0.886401,0.809115
480,0.216,0.418376,0.889165,0.805909
560,0.14,0.386282,0.8911,0.817958
640,0.1422,0.377237,0.898839,0.81717
720,0.1246,0.46768,0.898286,0.818467
800,0.0966,0.431102,0.902156,0.829135


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7673,0.525231,0.811222,0.590798
160,0.4781,0.423313,0.852681,0.684206
240,0.409,0.41213,0.859591,0.741075
320,0.2622,0.440577,0.864842,0.738965
400,0.2724,0.404936,0.872029,0.770452
480,0.1963,0.458724,0.877004,0.775145
560,0.1441,0.415143,0.890271,0.806014
640,0.1325,0.453341,0.880044,0.780049
720,0.1216,0.506112,0.881703,0.784094
800,0.0864,0.474741,0.887231,0.786908


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7673,0.525231,0.811222,0.590798
160,0.4781,0.423313,0.852681,0.684206
240,0.409,0.41213,0.859591,0.741075
320,0.2622,0.440577,0.864842,0.738965
400,0.2724,0.404936,0.872029,0.770452
480,0.1963,0.458724,0.877004,0.775145
560,0.1441,0.415143,0.890271,0.806014
640,0.1325,0.453341,0.880044,0.780049
720,0.1216,0.506112,0.881703,0.784094
800,0.0864,0.474741,0.887231,0.786908


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7673,0.525231,0.811222,0.590798
160,0.4781,0.423313,0.852681,0.684206
240,0.409,0.41213,0.859591,0.741075
320,0.2622,0.440577,0.864842,0.738965
400,0.2724,0.404936,0.872029,0.770452
480,0.1963,0.458724,0.877004,0.775145
560,0.1441,0.415143,0.890271,0.806014
640,0.1325,0.453341,0.880044,0.780049
720,0.1216,0.506112,0.881703,0.784094
800,0.0864,0.474741,0.887231,0.786908


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7439,0.545264,0.819514,0.596925
160,0.5146,0.439476,0.848811,0.690317
240,0.3986,0.41824,0.860973,0.737416
320,0.2656,0.411907,0.872029,0.777124
400,0.2434,0.395617,0.879215,0.800257
480,0.2066,0.40737,0.884467,0.812613
560,0.1352,0.435043,0.889994,0.809815
640,0.1334,0.447743,0.890271,0.811275
720,0.1096,0.492718,0.881979,0.797177
800,0.0861,0.497827,0.894417,0.810485


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7439,0.545264,0.819514,0.596925
160,0.5146,0.439476,0.848811,0.690317
240,0.3986,0.41824,0.860973,0.737416
320,0.2656,0.411907,0.872029,0.777124
400,0.2434,0.395617,0.879215,0.800257
480,0.2066,0.40737,0.884467,0.812613
560,0.1352,0.435043,0.889994,0.809815
640,0.1334,0.447743,0.890271,0.811275
720,0.1096,0.492718,0.881979,0.797177
800,0.0861,0.497827,0.894417,0.810485


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.7439,0.545264,0.819514,0.596925
160,0.5146,0.439476,0.848811,0.690317
240,0.3986,0.41824,0.860973,0.737416
320,0.2656,0.411907,0.872029,0.777124
400,0.2434,0.395617,0.879215,0.800257
480,0.2066,0.40737,0.884467,0.812613
560,0.1352,0.435043,0.889994,0.809815
640,0.1334,0.447743,0.890271,0.811275
720,0.1096,0.492718,0.881979,0.797177
800,0.0861,0.497827,0.894417,0.810485


DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8797,0.743593,0.702598,0.492579
160,0.6287,0.560012,0.794085,0.578756
240,0.5246,0.466572,0.839967,0.69513
320,0.3873,0.448383,0.837203,0.680845
400,0.3699,0.410941,0.855169,0.710878
480,0.3012,0.46737,0.863184,0.757039
560,0.185,0.440908,0.868712,0.767808
640,0.1998,0.441563,0.874793,0.763574
720,0.1549,0.476665,0.877557,0.791192
800,0.1132,0.492937,0.865395,0.76572


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8797,0.743593,0.702598,0.492579
160,0.6287,0.560012,0.794085,0.578756
240,0.5246,0.466572,0.839967,0.69513
320,0.3873,0.448383,0.837203,0.680845
400,0.3699,0.410941,0.855169,0.710878
480,0.3012,0.46737,0.863184,0.757039
560,0.185,0.440908,0.868712,0.767808
640,0.1998,0.441563,0.874793,0.763574
720,0.1549,0.476665,0.877557,0.791192
800,0.1132,0.492937,0.865395,0.76572


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8797,0.743593,0.702598,0.492579
160,0.6287,0.560012,0.794085,0.578756
240,0.5246,0.466572,0.839967,0.69513
320,0.3873,0.448383,0.837203,0.680845
400,0.3699,0.410941,0.855169,0.710878
480,0.3012,0.46737,0.863184,0.757039
560,0.185,0.440908,0.868712,0.767808
640,0.1998,0.441563,0.874793,0.763574
720,0.1549,0.476665,0.877557,0.791192
800,0.1132,0.492937,0.865395,0.76572


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8446,0.653261,0.749033,0.539069
160,0.6327,0.56679,0.778607,0.58825
240,0.5585,0.52231,0.808181,0.623328
320,0.4306,0.490266,0.820619,0.632435
400,0.4157,0.462349,0.83361,0.702998
480,0.3175,0.495322,0.84356,0.715823
560,0.2273,0.465434,0.858209,0.73057
640,0.2326,0.480543,0.849917,0.729666
720,0.1886,0.489314,0.865119,0.764881
800,0.1282,0.498577,0.875622,0.781525


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8446,0.653261,0.749033,0.539069
160,0.6327,0.56679,0.778607,0.58825
240,0.5585,0.52231,0.808181,0.623328
320,0.4306,0.490266,0.820619,0.632435
400,0.4157,0.462349,0.83361,0.702998
480,0.3175,0.495322,0.84356,0.715823
560,0.2273,0.465434,0.858209,0.73057
640,0.2326,0.480543,0.849917,0.729666
720,0.1886,0.489314,0.865119,0.764881
800,0.1282,0.498577,0.875622,0.781525


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8446,0.653261,0.749033,0.539069
160,0.6327,0.56679,0.778607,0.58825
240,0.5585,0.52231,0.808181,0.623328
320,0.4306,0.490266,0.820619,0.632435
400,0.4157,0.462349,0.83361,0.702998
480,0.3175,0.495322,0.84356,0.715823
560,0.2273,0.465434,0.858209,0.73057
640,0.2326,0.480543,0.849917,0.729666
720,0.1886,0.489314,0.865119,0.764881
800,0.1282,0.498577,0.875622,0.781525


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8512,0.7415,0.702045,0.485468
160,0.716,0.614764,0.771697,0.56929
240,0.5856,0.528491,0.797402,0.604605
320,0.4729,0.469048,0.830569,0.659355
400,0.4391,0.4198,0.842178,0.702067
480,0.3474,0.437069,0.849641,0.738519
560,0.2568,0.399602,0.866501,0.769902
640,0.234,0.454253,0.862078,0.762474
720,0.1756,0.497467,0.872582,0.780401
800,0.1495,0.465617,0.8712,0.775411


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8512,0.7415,0.702045,0.485468
160,0.716,0.614764,0.771697,0.56929
240,0.5856,0.528491,0.797402,0.604605
320,0.4729,0.469048,0.830569,0.659355
400,0.4391,0.4198,0.842178,0.702067
480,0.3474,0.437069,0.849641,0.738519
560,0.2568,0.399602,0.866501,0.769902
640,0.234,0.454253,0.862078,0.762474
720,0.1756,0.497467,0.872582,0.780401
800,0.1495,0.465617,0.8712,0.775411


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8512,0.7415,0.702045,0.485468
160,0.716,0.614764,0.771697,0.56929
240,0.5856,0.528491,0.797402,0.604605
320,0.4729,0.469048,0.830569,0.659355
400,0.4391,0.4198,0.842178,0.702067
480,0.3474,0.437069,0.849641,0.738519
560,0.2568,0.399602,0.866501,0.769902
640,0.234,0.454253,0.862078,0.762474
720,0.1756,0.497467,0.872582,0.780401
800,0.1495,0.465617,0.8712,0.775411


DatasetDict({
    train: Dataset({
        features: ['tweets', 'label'],
        num_rows: 14469
    })
    test: Dataset({
        features: ['tweets', 'label'],
        num_rows: 3618
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8661,0.790529,0.687673,0.439686
160,0.7186,0.664414,0.731896,0.520906
240,0.6078,0.647707,0.78524,0.603323
320,0.4383,0.598211,0.79298,0.635317
400,0.4235,0.527505,0.810116,0.679415
480,0.3501,0.648336,0.825871,0.707487
560,0.2198,0.577788,0.830846,0.720449
640,0.2234,0.604513,0.840796,0.740627
720,0.1632,0.655704,0.850746,0.769368
800,0.1229,0.696144,0.844389,0.756346


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8661,0.790529,0.687673,0.439686
160,0.7186,0.664414,0.731896,0.520906
240,0.6078,0.647707,0.78524,0.603323
320,0.4383,0.598211,0.79298,0.635317
400,0.4235,0.527505,0.810116,0.679415
480,0.3501,0.648336,0.825871,0.707487
560,0.2198,0.577788,0.830846,0.720449
640,0.2234,0.604513,0.840796,0.740627
720,0.1632,0.655704,0.850746,0.769368
800,0.1229,0.696144,0.844389,0.756346


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8661,0.790529,0.687673,0.439686
160,0.7186,0.664414,0.731896,0.520906
240,0.6078,0.647707,0.78524,0.603323
320,0.4383,0.598211,0.79298,0.635317
400,0.4235,0.527505,0.810116,0.679415
480,0.3501,0.648336,0.825871,0.707487
560,0.2198,0.577788,0.830846,0.720449
640,0.2234,0.604513,0.840796,0.740627
720,0.1632,0.655704,0.850746,0.769368
800,0.1229,0.696144,0.844389,0.756346


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8588,0.718871,0.717523,0.502476
160,0.72,0.63855,0.74848,0.543286
240,0.615,0.643548,0.776119,0.57692
320,0.438,0.622213,0.784964,0.640929
400,0.4465,0.538898,0.812051,0.671874
480,0.3231,0.634511,0.818961,0.690109
560,0.225,0.618836,0.818684,0.692832
640,0.2158,0.583978,0.830846,0.707548
720,0.1713,0.690104,0.820896,0.698248
800,0.1337,0.664157,0.83361,0.726233


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8588,0.718871,0.717523,0.502476
160,0.72,0.63855,0.74848,0.543286
240,0.615,0.643548,0.776119,0.57692
320,0.438,0.622213,0.784964,0.640929
400,0.4465,0.538898,0.812051,0.671874
480,0.3231,0.634511,0.818961,0.690109
560,0.225,0.618836,0.818684,0.692832
640,0.2158,0.583978,0.830846,0.707548
720,0.1713,0.690104,0.820896,0.698248
800,0.1337,0.664157,0.83361,0.726233


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8588,0.718871,0.717523,0.502476
160,0.72,0.63855,0.74848,0.543286
240,0.615,0.643548,0.776119,0.57692
320,0.438,0.622213,0.784964,0.640929
400,0.4465,0.538898,0.812051,0.671874
480,0.3231,0.634511,0.818961,0.690109
560,0.225,0.618836,0.818684,0.692832
640,0.2158,0.583978,0.830846,0.707548
720,0.1713,0.690104,0.820896,0.698248
800,0.1337,0.664157,0.83361,0.726233


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8459,0.706298,0.718629,0.493103
160,0.7323,0.641349,0.752626,0.52927
240,0.6258,0.598146,0.78607,0.59184
320,0.4388,0.573991,0.791045,0.660008
400,0.4234,0.532891,0.811774,0.686574
480,0.3349,0.610464,0.810945,0.705107
560,0.2187,0.579557,0.833057,0.726352
640,0.2033,0.619807,0.83361,0.73853
720,0.1587,0.705518,0.83361,0.743044
800,0.1321,0.655334,0.838861,0.744333


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8459,0.706298,0.718629,0.493103
160,0.7323,0.641349,0.752626,0.52927
240,0.6258,0.598146,0.78607,0.59184
320,0.4388,0.573991,0.791045,0.660008
400,0.4234,0.532891,0.811774,0.686574
480,0.3349,0.610464,0.810945,0.705107
560,0.2187,0.579557,0.833057,0.726352
640,0.2033,0.619807,0.83361,0.73853
720,0.1587,0.705518,0.83361,0.743044
800,0.1321,0.655334,0.838861,0.744333


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/14469 [00:00<?, ? examples/s]

Map:   0%|          | 0/3618 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
80,0.8459,0.706298,0.718629,0.493103
160,0.7323,0.641349,0.752626,0.52927
240,0.6258,0.598146,0.78607,0.59184
320,0.4388,0.573991,0.791045,0.660008
400,0.4234,0.532891,0.811774,0.686574
480,0.3349,0.610464,0.810945,0.705107
560,0.2187,0.579557,0.833057,0.726352
640,0.2033,0.619807,0.83361,0.73853
720,0.1587,0.705518,0.83361,0.743044
800,0.1321,0.655334,0.838861,0.744333


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.892482,0.833672
3,SI2M-Lab/DarijaBERT-arabizi,0.854892,0.791231
6,SI2M-Lab/DarijaBERT-mix,0.891929,0.828301
9,UBC-NLP/MARBERT,0.898286,0.840144
12,UBC-NLP/MARBERTv2,0.907407,0.836553
15,aubmindlab/bert-base-arabertv02-twitter,0.90796,0.852333
17,qarib/bert-base-qarib,0.902432,0.847129
