In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'MDOD_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df = pd.read_csv('datasets/Moroccan_Darija_Offensive_Language_Detection_Dataset.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3


      
display(df.columns)
display(len(df))
display(df[:4])



classes = set(df['label'].values)
display(classes)

c = df['label'].value_counts()
display(c)

df['label'] = df['label'].astype('category')
df['label'] = df['label'].cat.codes

df = df[['text', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


# ds = Dataset.from_pandas(df)
# ds = ds.train_test_split(test_size=0.2)

# display(ds)

max_sequence_length = 128


models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
]





seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
    
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True) # , batched=True
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)  # , batched=True
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 12
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 100, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 100
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-16 20:34:44.135062: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-16 20:34:44.159118: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['text', 'label'], dtype='object')

20402

Unnamed: 0,text,label
0,eh mais enfaite ‘zebi’ ça veut dire bise’ en verlan nan,1
1,je vais me réveiller à 6h au lieu de 7h histoire de réviser un peu zebi oslm tu m’a plus jamais revu,1
2,ma matrixe la video il est trop chou zebi,1
3,mmh tu manquer l’odeur de ta culotte nahchtoulimek y’a zebi,1


{0, 1}

label
0    12685
1     7717
Name: count, dtype: int64

2

20402

DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 16321
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 4081
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4203,0.317003,0.848076,0.833984
200,0.3271,0.304273,0.8716,0.859425
300,0.2726,0.331312,0.87356,0.868063
400,0.205,0.299594,0.881647,0.874341
500,0.207,0.303668,0.881647,0.875045
600,0.1308,0.336804,0.887037,0.878632
700,0.133,0.349659,0.885567,0.879745
800,0.1206,0.393386,0.890223,0.883635
900,0.0968,0.403982,0.893408,0.88749
1000,0.0966,0.389334,0.888753,0.882279


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4188,0.319185,0.854447,0.842292
200,0.3253,0.296854,0.872335,0.862017
300,0.2721,0.324039,0.870865,0.865095
400,0.206,0.29345,0.882137,0.875414
500,0.2019,0.307479,0.880176,0.872812
600,0.1372,0.360491,0.883362,0.874098
700,0.1365,0.331952,0.886302,0.879832
800,0.1195,0.39637,0.888263,0.881351
900,0.0899,0.38533,0.889488,0.883156
1000,0.1015,0.366655,0.884832,0.878394


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4188,0.319185,0.854447,0.842292
200,0.3253,0.296854,0.872335,0.862017
300,0.2721,0.324039,0.870865,0.865095
400,0.206,0.29345,0.882137,0.875414
500,0.2019,0.307479,0.880176,0.872812
600,0.1372,0.360491,0.883362,0.874098
700,0.1365,0.331952,0.886302,0.879832
800,0.1195,0.39637,0.888263,0.881351
900,0.0899,0.38533,0.889488,0.883156
1000,0.1015,0.366655,0.884832,0.878394


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4263,0.337502,0.848812,0.838738
200,0.3242,0.300581,0.868905,0.857208
300,0.2852,0.290449,0.879196,0.866601
400,0.2129,0.293805,0.884342,0.874793
500,0.2103,0.28376,0.891203,0.881332
600,0.1357,0.296333,0.892183,0.883587
700,0.1427,0.294607,0.893408,0.884249
800,0.1385,0.420007,0.897329,0.888934
900,0.1019,0.38211,0.893654,0.883897
1000,0.1106,0.362476,0.895859,0.889235


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4263,0.337502,0.848812,0.838738
200,0.3242,0.300581,0.868905,0.857208
300,0.2852,0.290449,0.879196,0.866601
400,0.2129,0.293805,0.884342,0.874793
500,0.2103,0.28376,0.891203,0.881332
600,0.1357,0.296333,0.892183,0.883587
700,0.1427,0.294607,0.893408,0.884249
800,0.1385,0.420007,0.897329,0.888934
900,0.1019,0.38211,0.893654,0.883897
1000,0.1106,0.362476,0.895859,0.889235


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4263,0.337502,0.848812,0.838738
200,0.3242,0.300581,0.868905,0.857208
300,0.2852,0.290449,0.879196,0.866601
400,0.2129,0.293805,0.884342,0.874793
500,0.2103,0.28376,0.891203,0.881332
600,0.1357,0.296333,0.892183,0.883587
700,0.1427,0.294607,0.893408,0.884249
800,0.1385,0.420007,0.897329,0.888934
900,0.1019,0.38211,0.893654,0.883897
1000,0.1106,0.362476,0.895859,0.889235


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4163,0.370616,0.834844,0.809245
200,0.3323,0.290274,0.875766,0.864805
300,0.2608,0.323407,0.874541,0.86286
400,0.2221,0.292723,0.878951,0.872062
500,0.2103,0.293283,0.887528,0.880127
600,0.136,0.317012,0.888508,0.880668
700,0.1405,0.375062,0.887528,0.878081
800,0.1291,0.377454,0.889978,0.883098
900,0.0965,0.391599,0.890958,0.884052
1000,0.0925,0.403199,0.893163,0.887164


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4163,0.370616,0.834844,0.809245
200,0.3323,0.290274,0.875766,0.864805
300,0.2608,0.323407,0.874541,0.86286
400,0.2221,0.292723,0.878951,0.872062
500,0.2103,0.293283,0.887528,0.880127
600,0.136,0.317012,0.888508,0.880668
700,0.1405,0.375062,0.887528,0.878081
800,0.1291,0.377454,0.889978,0.883098
900,0.0965,0.391599,0.890958,0.884052
1000,0.0925,0.403199,0.893163,0.887164


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4163,0.370616,0.834844,0.809245
200,0.3323,0.290274,0.875766,0.864805
300,0.2608,0.323407,0.874541,0.86286
400,0.2221,0.292723,0.878951,0.872062
500,0.2103,0.293283,0.887528,0.880127
600,0.136,0.317012,0.888508,0.880668
700,0.1405,0.375062,0.887528,0.878081
800,0.1291,0.377454,0.889978,0.883098
900,0.0965,0.391599,0.890958,0.884052
1000,0.0925,0.403199,0.893163,0.887164


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 16321
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 4081
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4328,0.349418,0.841951,0.82214
200,0.3435,0.3243,0.861309,0.847965
300,0.2814,0.341873,0.870865,0.862928
400,0.2106,0.309467,0.875766,0.866778
500,0.2085,0.322514,0.883362,0.873695
600,0.1357,0.39854,0.883117,0.874558
700,0.1433,0.34961,0.887528,0.879024
800,0.1281,0.534476,0.877971,0.87115
900,0.1006,0.466899,0.882137,0.875141
1000,0.1107,0.474242,0.888018,0.879618


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4328,0.349418,0.841951,0.82214
200,0.3435,0.3243,0.861309,0.847965
300,0.2814,0.341873,0.870865,0.862928
400,0.2106,0.309467,0.875766,0.866778
500,0.2085,0.322514,0.883362,0.873695
600,0.1357,0.39854,0.883117,0.874558
700,0.1433,0.34961,0.887528,0.879024
800,0.1281,0.534476,0.877971,0.87115
900,0.1006,0.466899,0.882137,0.875141
1000,0.1107,0.474242,0.888018,0.879618


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4328,0.349418,0.841951,0.82214
200,0.3435,0.3243,0.861309,0.847965
300,0.2814,0.341873,0.870865,0.862928
400,0.2106,0.309467,0.875766,0.866778
500,0.2085,0.322514,0.883362,0.873695
600,0.1357,0.39854,0.883117,0.874558
700,0.1433,0.34961,0.887528,0.879024
800,0.1281,0.534476,0.877971,0.87115
900,0.1006,0.466899,0.882137,0.875141
1000,0.1107,0.474242,0.888018,0.879618


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4286,0.344393,0.848076,0.831066
200,0.3431,0.322483,0.863269,0.848582
300,0.2977,0.306069,0.87356,0.859645
400,0.2169,0.297827,0.882382,0.873577
500,0.2089,0.293055,0.883362,0.8747
600,0.1498,0.310082,0.884097,0.875712
700,0.1406,0.3738,0.883852,0.876097
800,0.1313,0.474072,0.883607,0.876108
900,0.1021,0.430279,0.888018,0.880399
1000,0.111,0.41911,0.885812,0.878657


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4286,0.344393,0.848076,0.831066
200,0.3431,0.322483,0.863269,0.848582
300,0.2977,0.306069,0.87356,0.859645
400,0.2169,0.297827,0.882382,0.873577
500,0.2089,0.293055,0.883362,0.8747
600,0.1498,0.310082,0.884097,0.875712
700,0.1406,0.3738,0.883852,0.876097
800,0.1313,0.474072,0.883607,0.876108
900,0.1021,0.430279,0.888018,0.880399
1000,0.111,0.41911,0.885812,0.878657


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4286,0.344393,0.848076,0.831066
200,0.3431,0.322483,0.863269,0.848582
300,0.2977,0.306069,0.87356,0.859645
400,0.2169,0.297827,0.882382,0.873577
500,0.2089,0.293055,0.883362,0.8747
600,0.1498,0.310082,0.884097,0.875712
700,0.1406,0.3738,0.883852,0.876097
800,0.1313,0.474072,0.883607,0.876108
900,0.1021,0.430279,0.888018,0.880399
1000,0.111,0.41911,0.885812,0.878657


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.436,0.353687,0.844646,0.826154
200,0.3511,0.312816,0.864494,0.852404
300,0.2701,0.350843,0.866944,0.852577
400,0.227,0.3359,0.860328,0.853758
500,0.2209,0.321961,0.881157,0.871955
600,0.1437,0.406765,0.866699,0.86049
700,0.134,0.453959,0.875276,0.867069
800,0.1272,0.452096,0.879196,0.870062
900,0.1051,0.418335,0.883117,0.876714
1000,0.1071,0.436616,0.885567,0.876881


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.436,0.353687,0.844646,0.826154
200,0.3511,0.312816,0.864494,0.852404
300,0.2701,0.350843,0.866944,0.852577
400,0.227,0.3359,0.860328,0.853758
500,0.2209,0.321961,0.881157,0.871955
600,0.1437,0.406765,0.866699,0.86049
700,0.134,0.453959,0.875276,0.867069
800,0.1272,0.452096,0.879196,0.870062
900,0.1051,0.418335,0.883117,0.876714
1000,0.1071,0.436616,0.885567,0.876881


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.436,0.353687,0.844646,0.826154
200,0.3511,0.312816,0.864494,0.852404
300,0.2701,0.350843,0.866944,0.852577
400,0.227,0.3359,0.860328,0.853758
500,0.2209,0.321961,0.881157,0.871955
600,0.1437,0.406765,0.866699,0.86049
700,0.134,0.453959,0.875276,0.867069
800,0.1272,0.452096,0.879196,0.870062
900,0.1051,0.418335,0.883117,0.876714
1000,0.1071,0.436616,0.885567,0.876881


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 16321
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 4081
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4034,0.316622,0.858613,0.843558
200,0.3176,0.289777,0.878951,0.871003
300,0.2469,0.311463,0.879686,0.87439
400,0.1654,0.35541,0.887037,0.880185
500,0.1709,0.280656,0.888508,0.881832
600,0.1004,0.443451,0.885567,0.879772
700,0.1036,0.335516,0.889243,0.881692
800,0.0938,0.499783,0.888263,0.8821
900,0.0741,0.415214,0.881892,0.876549
1000,0.0917,0.40274,0.890958,0.884169


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4034,0.316622,0.858613,0.843558
200,0.3176,0.289777,0.878951,0.871003
300,0.2469,0.311463,0.879686,0.87439
400,0.1654,0.35541,0.887037,0.880185
500,0.1709,0.280656,0.888508,0.881832
600,0.1004,0.443451,0.885567,0.879772
700,0.1036,0.335516,0.889243,0.881692
800,0.0938,0.499783,0.888263,0.8821
900,0.0741,0.415214,0.881892,0.876549
1000,0.0917,0.40274,0.890958,0.884169


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4034,0.316622,0.858613,0.843558
200,0.3176,0.289777,0.878951,0.871003
300,0.2469,0.311463,0.879686,0.87439
400,0.1654,0.35541,0.887037,0.880185
500,0.1709,0.280656,0.888508,0.881832
600,0.1004,0.443451,0.885567,0.879772
700,0.1036,0.335516,0.889243,0.881692
800,0.0938,0.499783,0.888263,0.8821
900,0.0741,0.415214,0.881892,0.876549
1000,0.0917,0.40274,0.890958,0.884169


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4142,0.316144,0.859838,0.847953
200,0.3125,0.324572,0.8716,0.86195
300,0.2721,0.31462,0.878951,0.864591
400,0.1785,0.299526,0.881157,0.872559
500,0.1907,0.261976,0.895369,0.888102
600,0.1175,0.312061,0.892428,0.884834
700,0.1136,0.327209,0.888753,0.881661
800,0.113,0.530408,0.890223,0.883374
900,0.0868,0.400271,0.894144,0.884106
1000,0.0796,0.419454,0.893654,0.885468


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4142,0.316144,0.859838,0.847953
200,0.3125,0.324572,0.8716,0.86195
300,0.2721,0.31462,0.878951,0.864591
400,0.1785,0.299526,0.881157,0.872559
500,0.1907,0.261976,0.895369,0.888102
600,0.1175,0.312061,0.892428,0.884834
700,0.1136,0.327209,0.888753,0.881661
800,0.113,0.530408,0.890223,0.883374
900,0.0868,0.400271,0.894144,0.884106
1000,0.0796,0.419454,0.893654,0.885468


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4142,0.316144,0.859838,0.847953
200,0.3125,0.324572,0.8716,0.86195
300,0.2721,0.31462,0.878951,0.864591
400,0.1785,0.299526,0.881157,0.872559
500,0.1907,0.261976,0.895369,0.888102
600,0.1175,0.312061,0.892428,0.884834
700,0.1136,0.327209,0.888753,0.881661
800,0.113,0.530408,0.890223,0.883374
900,0.0868,0.400271,0.894144,0.884106
1000,0.0796,0.419454,0.893654,0.885468


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4049,0.34773,0.851752,0.834135
200,0.3241,0.291929,0.873805,0.865005
300,0.2451,0.31406,0.881647,0.871894
400,0.1783,0.312143,0.877971,0.873282
500,0.1809,0.299958,0.891448,0.885768
600,0.1113,0.381363,0.894144,0.888279
700,0.1047,0.399345,0.887773,0.880373
800,0.1048,0.501262,0.894389,0.88653
900,0.0746,0.428561,0.894144,0.886837
1000,0.0745,0.441602,0.894634,0.887715


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4049,0.34773,0.851752,0.834135
200,0.3241,0.291929,0.873805,0.865005
300,0.2451,0.31406,0.881647,0.871894
400,0.1783,0.312143,0.877971,0.873282
500,0.1809,0.299958,0.891448,0.885768
600,0.1113,0.381363,0.894144,0.888279
700,0.1047,0.399345,0.887773,0.880373
800,0.1048,0.501262,0.894389,0.88653
900,0.0746,0.428561,0.894144,0.886837
1000,0.0745,0.441602,0.894634,0.887715


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4049,0.34773,0.851752,0.834135
200,0.3241,0.291929,0.873805,0.865005
300,0.2451,0.31406,0.881647,0.871894
400,0.1783,0.312143,0.877971,0.873282
500,0.1809,0.299958,0.891448,0.885768
600,0.1113,0.381363,0.894144,0.888279
700,0.1047,0.399345,0.887773,0.880373
800,0.1048,0.501262,0.894389,0.88653
900,0.0746,0.428561,0.894144,0.886837
1000,0.0745,0.441602,0.894634,0.887715


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 16321
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 4081
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4329,0.335106,0.848076,0.834898
200,0.3426,0.328231,0.865229,0.857106
300,0.2676,0.34118,0.859593,0.854241
400,0.189,0.395532,0.877481,0.867863
500,0.1828,0.335663,0.878706,0.873525
600,0.1194,0.427692,0.883362,0.875076
700,0.1244,0.40467,0.87013,0.864652
800,0.0992,0.443618,0.882872,0.875965
900,0.0739,0.669171,0.86817,0.862176
1000,0.0843,0.497922,0.884832,0.877677


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4329,0.335106,0.848076,0.834898
200,0.3426,0.328231,0.865229,0.857106
300,0.2676,0.34118,0.859593,0.854241
400,0.189,0.395532,0.877481,0.867863
500,0.1828,0.335663,0.878706,0.873525
600,0.1194,0.427692,0.883362,0.875076
700,0.1244,0.40467,0.87013,0.864652
800,0.0992,0.443618,0.882872,0.875965
900,0.0739,0.669171,0.86817,0.862176
1000,0.0843,0.497922,0.884832,0.877677


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4329,0.335106,0.848076,0.834898
200,0.3426,0.328231,0.865229,0.857106
300,0.2676,0.34118,0.859593,0.854241
400,0.189,0.395532,0.877481,0.867863
500,0.1828,0.335663,0.878706,0.873525
600,0.1194,0.427692,0.883362,0.875076
700,0.1244,0.40467,0.87013,0.864652
800,0.0992,0.443618,0.882872,0.875965
900,0.0739,0.669171,0.86817,0.862176
1000,0.0843,0.497922,0.884832,0.877677


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4256,0.355626,0.853222,0.836928
200,0.3298,0.297137,0.878706,0.869203
300,0.2701,0.350384,0.881402,0.868839
400,0.1898,0.301518,0.885322,0.87859
500,0.1947,0.27506,0.883852,0.876667
600,0.1235,0.375027,0.886547,0.875692
700,0.1178,0.329399,0.886302,0.877993
800,0.1327,0.475144,0.881647,0.874278
900,0.0864,0.480287,0.880176,0.872587
1000,0.1047,0.487979,0.882137,0.873011


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4256,0.355626,0.853222,0.836928
200,0.3298,0.297137,0.878706,0.869203
300,0.2701,0.350384,0.881402,0.868839
400,0.1898,0.301518,0.885322,0.87859
500,0.1947,0.27506,0.883852,0.876667
600,0.1235,0.375027,0.886547,0.875692
700,0.1178,0.329399,0.886302,0.877993
800,0.1327,0.475144,0.881647,0.874278
900,0.0864,0.480287,0.880176,0.872587
1000,0.1047,0.487979,0.882137,0.873011


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4256,0.355626,0.853222,0.836928
200,0.3298,0.297137,0.878706,0.869203
300,0.2701,0.350384,0.881402,0.868839
400,0.1898,0.301518,0.885322,0.87859
500,0.1947,0.27506,0.883852,0.876667
600,0.1235,0.375027,0.886547,0.875692
700,0.1178,0.329399,0.886302,0.877993
800,0.1327,0.475144,0.881647,0.874278
900,0.0864,0.480287,0.880176,0.872587
1000,0.1047,0.487979,0.882137,0.873011


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4424,0.360183,0.851997,0.835652
200,0.3486,0.296177,0.87062,0.86002
300,0.2729,0.368644,0.8716,0.860999
400,0.1883,0.327762,0.881647,0.874529
500,0.1976,0.348782,0.890223,0.881939
600,0.1303,0.450112,0.889488,0.882842
700,0.1245,0.341857,0.882872,0.875149
800,0.1131,0.554713,0.884097,0.87578
900,0.0852,0.605575,0.885812,0.878156
1000,0.094,0.501556,0.884832,0.875685


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4424,0.360183,0.851997,0.835652
200,0.3486,0.296177,0.87062,0.86002
300,0.2729,0.368644,0.8716,0.860999
400,0.1883,0.327762,0.881647,0.874529
500,0.1976,0.348782,0.890223,0.881939
600,0.1303,0.450112,0.889488,0.882842
700,0.1245,0.341857,0.882872,0.875149
800,0.1131,0.554713,0.884097,0.87578
900,0.0852,0.605575,0.885812,0.878156
1000,0.094,0.501556,0.884832,0.875685


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4424,0.360183,0.851997,0.835652
200,0.3486,0.296177,0.87062,0.86002
300,0.2729,0.368644,0.8716,0.860999
400,0.1883,0.327762,0.881647,0.874529
500,0.1976,0.348782,0.890223,0.881939
600,0.1303,0.450112,0.889488,0.882842
700,0.1245,0.341857,0.882872,0.875149
800,0.1131,0.554713,0.884097,0.87578
900,0.0852,0.605575,0.885812,0.878156
1000,0.094,0.501556,0.884832,0.875685


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 16321
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 4081
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4571,0.341692,0.836315,0.815077
200,0.3447,0.312992,0.86964,0.859764
300,0.2779,0.358942,0.871355,0.866052
400,0.2081,0.306516,0.891693,0.883258
500,0.2045,0.292638,0.891203,0.885284
600,0.125,0.351902,0.888018,0.880208
700,0.1369,0.327624,0.879931,0.874711
800,0.11,0.495667,0.890958,0.884985
900,0.0869,0.487429,0.891938,0.885065
1000,0.0949,0.412056,0.891448,0.885583


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4571,0.341692,0.836315,0.815077
200,0.3447,0.312992,0.86964,0.859764
300,0.2779,0.358942,0.871355,0.866052
400,0.2081,0.306516,0.891693,0.883258
500,0.2045,0.292638,0.891203,0.885284
600,0.125,0.351902,0.888018,0.880208
700,0.1369,0.327624,0.879931,0.874711
800,0.11,0.495667,0.890958,0.884985
900,0.0869,0.487429,0.891938,0.885065
1000,0.0949,0.412056,0.891448,0.885583


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4571,0.341692,0.836315,0.815077
200,0.3447,0.312992,0.86964,0.859764
300,0.2779,0.358942,0.871355,0.866052
400,0.2081,0.306516,0.891693,0.883258
500,0.2045,0.292638,0.891203,0.885284
600,0.125,0.351902,0.888018,0.880208
700,0.1369,0.327624,0.879931,0.874711
800,0.11,0.495667,0.890958,0.884985
900,0.0869,0.487429,0.891938,0.885065
1000,0.0949,0.412056,0.891448,0.885583


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4288,0.308386,0.859348,0.844657
200,0.323,0.294741,0.876256,0.866862
300,0.2789,0.330708,0.884097,0.876212
400,0.2023,0.284097,0.891693,0.884309
500,0.1999,0.280222,0.889733,0.884188
600,0.1235,0.295397,0.889488,0.881654
700,0.1233,0.31613,0.897819,0.890575
800,0.1202,0.511721,0.881402,0.87645
900,0.0867,0.387828,0.891693,0.884993
1000,0.0895,0.458582,0.894389,0.887144


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4288,0.308386,0.859348,0.844657
200,0.323,0.294741,0.876256,0.866862
300,0.2789,0.330708,0.884097,0.876212
400,0.2023,0.284097,0.891693,0.884309
500,0.1999,0.280222,0.889733,0.884188
600,0.1235,0.295397,0.889488,0.881654
700,0.1233,0.31613,0.897819,0.890575
800,0.1202,0.511721,0.881402,0.87645
900,0.0867,0.387828,0.891693,0.884993
1000,0.0895,0.458582,0.894389,0.887144


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4288,0.308386,0.859348,0.844657
200,0.323,0.294741,0.876256,0.866862
300,0.2789,0.330708,0.884097,0.876212
400,0.2023,0.284097,0.891693,0.884309
500,0.1999,0.280222,0.889733,0.884188
600,0.1235,0.295397,0.889488,0.881654
700,0.1233,0.31613,0.897819,0.890575
800,0.1202,0.511721,0.881402,0.87645
900,0.0867,0.387828,0.891693,0.884993
1000,0.0895,0.458582,0.894389,0.887144


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4221,0.337495,0.861063,0.847962
200,0.3391,0.289371,0.870375,0.861953
300,0.2615,0.345929,0.875766,0.863308
400,0.2118,0.300721,0.87356,0.869226
500,0.2178,0.307603,0.895369,0.887552
600,0.1357,0.333968,0.895859,0.889375
700,0.123,0.389857,0.898554,0.891407
800,0.124,0.404656,0.896104,0.888139
900,0.0866,0.412632,0.894879,0.889327
1000,0.0902,0.423277,0.897574,0.891017


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4221,0.337495,0.861063,0.847962
200,0.3391,0.289371,0.870375,0.861953
300,0.2615,0.345929,0.875766,0.863308
400,0.2118,0.300721,0.87356,0.869226
500,0.2178,0.307603,0.895369,0.887552
600,0.1357,0.333968,0.895859,0.889375
700,0.123,0.389857,0.898554,0.891407
800,0.124,0.404656,0.896104,0.888139
900,0.0866,0.412632,0.894879,0.889327
1000,0.0902,0.423277,0.897574,0.891017


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/16321 [00:00<?, ? examples/s]

Map:   0%|          | 0/4081 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
100,0.4221,0.337495,0.861063,0.847962
200,0.3391,0.289371,0.870375,0.861953
300,0.2615,0.345929,0.875766,0.863308
400,0.2118,0.300721,0.87356,0.869226
500,0.2178,0.307603,0.895369,0.887552
600,0.1357,0.333968,0.895859,0.889375
700,0.123,0.389857,0.898554,0.891407
800,0.124,0.404656,0.896104,0.888139
900,0.0866,0.412632,0.894879,0.889327
1000,0.0902,0.423277,0.897574,0.891017


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.893654,0.886612
3,UBC-NLP/MARBERT,0.889488,0.882842
6,UBC-NLP/MARBERTv2,0.897819,0.892644
9,aubmindlab/bert-base-arabertv02-twitter,0.900025,0.892238
12,qarib/bert-base-qarib,0.898064,0.890585
