In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score, precision_score, recall_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
import torch
import torch.nn as nn
from transformers import AutoModel, TrainingArguments, Trainer, BertModel
from transformers.modeling_outputs import SequenceClassifierOutput
import numpy as np
from sklearn.metrics import confusion_matrix, ConfusionMatrixDisplay
import matplotlib.pyplot as plt
import seaborn as sns
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'Tadawul_emotions'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,Precision,Recall,F1\n')


df = pd.read_csv('Tadawul_Sentiment_Emotions_Analysis.csv', encoding='utf-8', engine='python', sep='\t')



df.fillna('', inplace=True)  
display(len(df))


display(df.columns)
display(len(df))
display(df[:4])



classes = set(df['emotion'].values)
display(classes)

c = df['emotion'].value_counts()
display(c)

df['emotion'] = df['emotion'].astype('category')
df['label'] = df['emotion'].cat.codes

df = df[['text', 'label']]

classes_num = len(classes)
display(classes_num)
display(len(df))


max_sequence_length = 128



class BertLSTMModel(nn.Module):
    def __init__(self, model_name, num_labels, hidden_dim=128, num_layers=2):
        super(BertLSTMModel, self).__init__()
        
        self.bert = AutoModel.from_pretrained(model_name)
        self.lstm = nn.LSTM(input_size=self.bert.config.hidden_size, 
                            hidden_size=hidden_dim, 
                            num_layers=num_layers, 
                            batch_first=True, 
                            bidirectional=True)
        self.classifier = nn.Linear(hidden_dim * 2, num_labels)
        self.num_labels = num_labels
    
    def forward(self, input_ids, attention_mask, labels=None):
        bert_outputs = self.bert(input_ids=input_ids, attention_mask=attention_mask)
        sequence_output = bert_outputs.last_hidden_state
        lstm_output, _ = self.lstm(sequence_output)
        lstm_output = lstm_output[:, -1, :]  
        logits = self.classifier(lstm_output)
        
        loss = None
        if labels is not None:
            loss_fct = nn.CrossEntropyLoss()
            loss = loss_fct(logits.view(-1, self.num_labels), labels.view(-1))
        
        return SequenceClassifierOutput(
            loss=loss,
            logits=logits,
        )



class BertCNNModel(nn.Module):
    def __init__(self, model_name, num_labels, num_filters=100, filter_sizes=[3, 4, 5]):
        super(BertCNNModel, self).__init__()
        self.bert = BertModel.from_pretrained(model_name)
        self.convs = nn.ModuleList([
            nn.Conv2d(1, num_filters, (fs, self.bert.config.hidden_size)) for fs in filter_sizes
        ])
        self.classifier = nn.Linear(len(filter_sizes) * num_filters, num_labels)
        self.num_labels = num_labels


    def forward(self, input_ids, attention_mask, token_type_ids=None, labels=None):
        bert_outputs = self.bert(input_ids=input_ids, attention_mask=attention_mask, token_type_ids=token_type_ids)
        sequence_output = bert_outputs.last_hidden_state.unsqueeze(1) 

        conv_outputs = [torch.relu(conv(sequence_output)).squeeze(3) for conv in self.convs]
        pooled_outputs = [torch.max(output, 2)[0] for output in conv_outputs]
        cat_output = torch.cat(pooled_outputs, 1)
        
        logits = self.classifier(cat_output)
        
        loss = None
        if labels is not None:
            loss_fct = nn.CrossEntropyLoss()
            loss = loss_fct(logits.view(-1, self.num_labels), labels.view(-1))
        
        return SequenceClassifierOutput(
            loss=loss,
            logits=logits,
        )



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
        'faisalq/SaudiBERT',
        'SaudiBERT_LSTM',
        'SaudiBERT_CNN',    
]


seeds = [0, 1, 42]


for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            if(model_name == 'SaudiBERT_LSTM'):
                tokenizer = AutoTokenizer.from_pretrained('faisalq/SaudiBERT')
                model = BertLSTMModel(model_name='faisalq/SaudiBERT', num_labels=classes_num).to('cuda')       
            elif(model_name == 'SaudiBERT_CNN'):
                tokenizer = AutoTokenizer.from_pretrained('faisalq/SaudiBERT')
                model = BertCNNModel(model_name='faisalq/SaudiBERT', num_labels=classes_num).to('cuda')
            else:
                tokenizer = AutoTokenizer.from_pretrained(model_name)                
                model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True) 
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)  
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')  
                precision = precision_score(labels, predictions, average='macro')
                recall = recall_score(labels, predictions, average='macro')
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{precision},{recall},{f1}\n')
                return {'accuracy': acc, 'precision': precision, 'recall':recall, 'f1_score': f1}
    
    
            
            
            epochs = 8
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 50, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 50
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'Precision', 'Recall', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-30 04:13:32.782340: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-30 04:13:32.806188: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


11953

Index(['text', 'sentiment', 'emotion'], dtype='object')

11953

Unnamed: 0,text,sentiment,emotion
0,الله يعوضك خيرا مماخسرت ويوفقك من خيري الدنيا والاخرة,p,Sadness
1,من جدك هذا وانت استاذنا الله يعوضك اضعافها يارب,p,Sadness
2,الله يعوضك اضعاف ماخسرت ويرزقك بر ولدك وجميع الاخوان,p,Sadness
3,انما النصر صبر ساعه,p,Happiness


{'Anger', 'Fear', 'Happiness', 'Sadness'}

emotion
Happiness    5590
Anger        2602
Fear         2596
Sadness      1165
Name: count, dtype: int64

4

11953

DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8875,0.659288,0.740276,0.687098,0.682048,0.682412
100,0.6394,0.513067,0.808867,0.786466,0.755307,0.768973
150,0.5549,0.468465,0.82476,0.810882,0.779179,0.788846
200,0.3026,0.480065,0.81514,0.791499,0.785271,0.785147
250,0.3146,0.493966,0.815977,0.77532,0.811241,0.790113
300,0.2987,0.443848,0.83647,0.815091,0.793989,0.803163
350,0.1254,0.532885,0.827269,0.789019,0.80041,0.79334
400,0.1167,0.577268,0.828105,0.797081,0.798617,0.795559
450,0.1364,0.556591,0.835634,0.806529,0.802545,0.802669
500,0.0685,0.609853,0.826432,0.789525,0.804909,0.796493


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.864,0.64929,0.755332,0.701837,0.713209,0.705939
100,0.637,0.526533,0.801757,0.792234,0.740699,0.760221
150,0.5452,0.464676,0.825178,0.801034,0.781729,0.789529
200,0.307,0.469088,0.831033,0.804971,0.791095,0.797363
250,0.308,0.51398,0.808867,0.767369,0.809415,0.783886
300,0.2787,0.460127,0.843162,0.821881,0.812575,0.813158
350,0.1265,0.534278,0.828942,0.793041,0.80979,0.800724
400,0.1173,0.534501,0.842325,0.809869,0.812273,0.809726
450,0.1375,0.534538,0.840652,0.814994,0.803405,0.807681
500,0.0656,0.659415,0.827269,0.791077,0.806097,0.791208


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.864,0.64929,0.755332,0.701837,0.713209,0.705939
100,0.637,0.526533,0.801757,0.792234,0.740699,0.760221
150,0.5452,0.464676,0.825178,0.801034,0.781729,0.789529
200,0.307,0.469088,0.831033,0.804971,0.791095,0.797363
250,0.308,0.51398,0.808867,0.767369,0.809415,0.783886
300,0.2787,0.460127,0.843162,0.821881,0.812575,0.813158
350,0.1265,0.534278,0.828942,0.793041,0.80979,0.800724
400,0.1173,0.534501,0.842325,0.809869,0.812273,0.809726
450,0.1375,0.534538,0.840652,0.814994,0.803405,0.807681
500,0.0656,0.659415,0.827269,0.791077,0.806097,0.791208


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8688,0.654351,0.75115,0.714486,0.678166,0.690975
100,0.5952,0.55903,0.795065,0.780507,0.739108,0.749029
150,0.5386,0.49727,0.810958,0.79594,0.762625,0.775843
200,0.307,0.55291,0.798411,0.756985,0.797674,0.771972
250,0.2869,0.515717,0.820577,0.784019,0.801956,0.790452
300,0.3177,0.514759,0.821414,0.815786,0.782618,0.788979
350,0.1277,0.574928,0.82936,0.800337,0.804965,0.800932
400,0.1357,0.572585,0.818904,0.782701,0.797156,0.788773
450,0.1472,0.576806,0.822668,0.786629,0.797968,0.791326
500,0.0558,0.710594,0.823505,0.794973,0.797766,0.795199


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8688,0.654351,0.75115,0.714486,0.678166,0.690975
100,0.5952,0.55903,0.795065,0.780507,0.739108,0.749029
150,0.5386,0.49727,0.810958,0.79594,0.762625,0.775843
200,0.307,0.55291,0.798411,0.756985,0.797674,0.771972
250,0.2869,0.515717,0.820577,0.784019,0.801956,0.790452
300,0.3177,0.514759,0.821414,0.815786,0.782618,0.788979
350,0.1277,0.574928,0.82936,0.800337,0.804965,0.800932
400,0.1357,0.572585,0.818904,0.782701,0.797156,0.788773
450,0.1472,0.576806,0.822668,0.786629,0.797968,0.791326
500,0.0558,0.710594,0.823505,0.794973,0.797766,0.795199


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8688,0.654351,0.75115,0.714486,0.678166,0.690975
100,0.5952,0.55903,0.795065,0.780507,0.739108,0.749029
150,0.5386,0.49727,0.810958,0.79594,0.762625,0.775843
200,0.307,0.55291,0.798411,0.756985,0.797674,0.771972
250,0.2869,0.515717,0.820577,0.784019,0.801956,0.790452
300,0.3177,0.514759,0.821414,0.815786,0.782618,0.788979
350,0.1277,0.574928,0.82936,0.800337,0.804965,0.800932
400,0.1357,0.572585,0.818904,0.782701,0.797156,0.788773
450,0.1472,0.576806,0.822668,0.786629,0.797968,0.791326
500,0.0558,0.710594,0.823505,0.794973,0.797766,0.795199


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8734,0.666138,0.73693,0.69649,0.654278,0.666401
100,0.5879,0.601942,0.758678,0.710926,0.753561,0.72421
150,0.5211,0.496968,0.79632,0.748328,0.78165,0.758964
200,0.2957,0.501329,0.822668,0.790622,0.783865,0.78659
250,0.2744,0.488182,0.815977,0.780569,0.777552,0.778646
300,0.2999,0.490663,0.820577,0.785323,0.782537,0.782693
350,0.1121,0.640235,0.803848,0.798344,0.760695,0.764439
400,0.1295,0.638972,0.803011,0.762473,0.797205,0.770276
450,0.128,0.57017,0.818486,0.774235,0.799268,0.785063
500,0.0575,0.668673,0.824341,0.79602,0.793706,0.792549


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8734,0.666138,0.73693,0.69649,0.654278,0.666401
100,0.5879,0.601942,0.758678,0.710926,0.753561,0.72421
150,0.5211,0.496968,0.79632,0.748328,0.78165,0.758964
200,0.2957,0.501329,0.822668,0.790622,0.783865,0.78659
250,0.2744,0.488182,0.815977,0.780569,0.777552,0.778646
300,0.2999,0.490663,0.820577,0.785323,0.782537,0.782693
350,0.1121,0.640235,0.803848,0.798344,0.760695,0.764439
400,0.1295,0.638972,0.803011,0.762473,0.797205,0.770276
450,0.128,0.57017,0.818486,0.774235,0.799268,0.785063
500,0.0575,0.668673,0.824341,0.79602,0.793706,0.792549


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8734,0.666138,0.73693,0.69649,0.654278,0.666401
100,0.5879,0.601942,0.758678,0.710926,0.753561,0.72421
150,0.5211,0.496968,0.79632,0.748328,0.78165,0.758964
200,0.2957,0.501329,0.822668,0.790622,0.783865,0.78659
250,0.2744,0.488182,0.815977,0.780569,0.777552,0.778646
300,0.2999,0.490663,0.820577,0.785323,0.782537,0.782693
350,0.1121,0.640235,0.803848,0.798344,0.760695,0.764439
400,0.1295,0.638972,0.803011,0.762473,0.797205,0.770276
450,0.128,0.57017,0.818486,0.774235,0.799268,0.785063
500,0.0575,0.668673,0.824341,0.79602,0.793706,0.792549


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9957,0.781535,0.690088,0.695853,0.574878,0.566665
100,0.7914,0.663569,0.745713,0.702457,0.689206,0.69064
150,0.6789,0.60271,0.76537,0.732182,0.709393,0.718454
200,0.3756,0.671092,0.748641,0.70437,0.709119,0.704475
250,0.3651,0.640638,0.762442,0.719448,0.721712,0.716851
300,0.3629,0.583051,0.791301,0.759974,0.740531,0.748572
350,0.1569,0.758246,0.765788,0.719678,0.74199,0.725815
400,0.1255,0.765949,0.785027,0.756166,0.731656,0.742124
450,0.144,0.757769,0.781263,0.739988,0.742976,0.740557
500,0.0587,0.985382,0.774571,0.735382,0.73392,0.730023


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9957,0.781535,0.690088,0.695853,0.574878,0.566665
100,0.7914,0.663569,0.745713,0.702457,0.689206,0.69064
150,0.6789,0.60271,0.76537,0.732182,0.709393,0.718454
200,0.3756,0.671092,0.748641,0.70437,0.709119,0.704475
250,0.3651,0.640638,0.762442,0.719448,0.721712,0.716851
300,0.3629,0.583051,0.791301,0.759974,0.740531,0.748572
350,0.1569,0.758246,0.765788,0.719678,0.74199,0.725815
400,0.1255,0.765949,0.785027,0.756166,0.731656,0.742124
450,0.144,0.757769,0.781263,0.739988,0.742976,0.740557
500,0.0587,0.985382,0.774571,0.735382,0.73392,0.730023


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9957,0.781535,0.690088,0.695853,0.574878,0.566665
100,0.7914,0.663569,0.745713,0.702457,0.689206,0.69064
150,0.6789,0.60271,0.76537,0.732182,0.709393,0.718454
200,0.3756,0.671092,0.748641,0.70437,0.709119,0.704475
250,0.3651,0.640638,0.762442,0.719448,0.721712,0.716851
300,0.3629,0.583051,0.791301,0.759974,0.740531,0.748572
350,0.1569,0.758246,0.765788,0.719678,0.74199,0.725815
400,0.1255,0.765949,0.785027,0.756166,0.731656,0.742124
450,0.144,0.757769,0.781263,0.739988,0.742976,0.740557
500,0.0587,0.985382,0.774571,0.735382,0.73392,0.730023


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0091,0.833838,0.679632,0.69856,0.531994,0.534178
100,0.7409,0.6515,0.744877,0.731399,0.666014,0.688396
150,0.6739,0.631114,0.750732,0.725908,0.692599,0.700463
200,0.3818,0.616509,0.776244,0.754991,0.718533,0.731624
250,0.3491,0.591457,0.792137,0.766624,0.747156,0.755282
300,0.3778,0.610762,0.780427,0.750601,0.729389,0.737854
350,0.1281,0.82183,0.785027,0.766367,0.723705,0.74025
400,0.1574,0.781703,0.790882,0.769055,0.738816,0.749948
450,0.1163,0.909859,0.757842,0.729781,0.70551,0.71051
500,0.043,1.043598,0.772898,0.744767,0.730565,0.734772


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0091,0.833838,0.679632,0.69856,0.531994,0.534178
100,0.7409,0.6515,0.744877,0.731399,0.666014,0.688396
150,0.6739,0.631114,0.750732,0.725908,0.692599,0.700463
200,0.3818,0.616509,0.776244,0.754991,0.718533,0.731624
250,0.3491,0.591457,0.792137,0.766624,0.747156,0.755282
300,0.3778,0.610762,0.780427,0.750601,0.729389,0.737854
350,0.1281,0.82183,0.785027,0.766367,0.723705,0.74025
400,0.1574,0.781703,0.790882,0.769055,0.738816,0.749948
450,0.1163,0.909859,0.757842,0.729781,0.70551,0.71051
500,0.043,1.043598,0.772898,0.744767,0.730565,0.734772


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0091,0.833838,0.679632,0.69856,0.531994,0.534178
100,0.7409,0.6515,0.744877,0.731399,0.666014,0.688396
150,0.6739,0.631114,0.750732,0.725908,0.692599,0.700463
200,0.3818,0.616509,0.776244,0.754991,0.718533,0.731624
250,0.3491,0.591457,0.792137,0.766624,0.747156,0.755282
300,0.3778,0.610762,0.780427,0.750601,0.729389,0.737854
350,0.1281,0.82183,0.785027,0.766367,0.723705,0.74025
400,0.1574,0.781703,0.790882,0.769055,0.738816,0.749948
450,0.1163,0.909859,0.757842,0.729781,0.70551,0.71051
500,0.043,1.043598,0.772898,0.744767,0.730565,0.734772


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0276,0.803454,0.676704,0.656212,0.523756,0.529245
100,0.7334,0.71136,0.717691,0.664349,0.685049,0.66916
150,0.6566,0.646682,0.751987,0.721184,0.69167,0.695955
200,0.3787,0.649163,0.765788,0.719219,0.719154,0.719108
250,0.3556,0.64822,0.775408,0.746443,0.71524,0.725036
300,0.3673,0.620227,0.772898,0.733765,0.726944,0.729874
350,0.1343,0.913477,0.742367,0.721231,0.723667,0.710563
400,0.129,0.824697,0.775826,0.742053,0.718747,0.72851
450,0.132,0.779473,0.777499,0.738276,0.733747,0.734105
500,0.0575,1.074143,0.756169,0.715766,0.724144,0.712266


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0276,0.803454,0.676704,0.656212,0.523756,0.529245
100,0.7334,0.71136,0.717691,0.664349,0.685049,0.66916
150,0.6566,0.646682,0.751987,0.721184,0.69167,0.695955
200,0.3787,0.649163,0.765788,0.719219,0.719154,0.719108
250,0.3556,0.64822,0.775408,0.746443,0.71524,0.725036
300,0.3673,0.620227,0.772898,0.733765,0.726944,0.729874
350,0.1343,0.913477,0.742367,0.721231,0.723667,0.710563
400,0.129,0.824697,0.775826,0.742053,0.718747,0.72851
450,0.132,0.779473,0.777499,0.738276,0.733747,0.734105
500,0.0575,1.074143,0.756169,0.715766,0.724144,0.712266


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0276,0.803454,0.676704,0.656212,0.523756,0.529245
100,0.7334,0.71136,0.717691,0.664349,0.685049,0.66916
150,0.6566,0.646682,0.751987,0.721184,0.69167,0.695955
200,0.3787,0.649163,0.765788,0.719219,0.719154,0.719108
250,0.3556,0.64822,0.775408,0.746443,0.71524,0.725036
300,0.3673,0.620227,0.772898,0.733765,0.726944,0.729874
350,0.1343,0.913477,0.742367,0.721231,0.723667,0.710563
400,0.129,0.824697,0.775826,0.742053,0.718747,0.72851
450,0.132,0.779473,0.777499,0.738276,0.733747,0.734105
500,0.0575,1.074143,0.756169,0.715766,0.724144,0.712266


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8707,0.660553,0.74655,0.69537,0.713912,0.698682
100,0.6215,0.507093,0.808448,0.795419,0.75726,0.770104
150,0.543,0.461802,0.826014,0.808961,0.785252,0.7958
200,0.2391,0.519151,0.816395,0.778242,0.791871,0.781591
250,0.266,0.496675,0.830615,0.81874,0.787889,0.798021
300,0.259,0.479092,0.839398,0.829329,0.780249,0.797017
350,0.0871,0.701775,0.824341,0.802366,0.78647,0.78952
400,0.1081,0.6429,0.823087,0.785751,0.801418,0.792342
450,0.0983,0.607314,0.827687,0.789082,0.804643,0.795906
500,0.0416,0.720482,0.832706,0.798351,0.806736,0.801451


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8707,0.660553,0.74655,0.69537,0.713912,0.698682
100,0.6215,0.507093,0.808448,0.795419,0.75726,0.770104
150,0.543,0.461802,0.826014,0.808961,0.785252,0.7958
200,0.2391,0.519151,0.816395,0.778242,0.791871,0.781591
250,0.266,0.496675,0.830615,0.81874,0.787889,0.798021
300,0.259,0.479092,0.839398,0.829329,0.780249,0.797017
350,0.0871,0.701775,0.824341,0.802366,0.78647,0.78952
400,0.1081,0.6429,0.823087,0.785751,0.801418,0.792342
450,0.0983,0.607314,0.827687,0.789082,0.804643,0.795906
500,0.0416,0.720482,0.832706,0.798351,0.806736,0.801451


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8707,0.660553,0.74655,0.69537,0.713912,0.698682
100,0.6215,0.507093,0.808448,0.795419,0.75726,0.770104
150,0.543,0.461802,0.826014,0.808961,0.785252,0.7958
200,0.2391,0.519151,0.816395,0.778242,0.791871,0.781591
250,0.266,0.496675,0.830615,0.81874,0.787889,0.798021
300,0.259,0.479092,0.839398,0.829329,0.780249,0.797017
350,0.0871,0.701775,0.824341,0.802366,0.78647,0.78952
400,0.1081,0.6429,0.823087,0.785751,0.801418,0.792342
450,0.0983,0.607314,0.827687,0.789082,0.804643,0.795906
500,0.0416,0.720482,0.832706,0.798351,0.806736,0.801451


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8648,0.659482,0.75115,0.752335,0.668121,0.696826
100,0.5889,0.521688,0.798829,0.798671,0.732698,0.753305
150,0.5421,0.464491,0.820995,0.786643,0.796635,0.789596
200,0.2509,0.496639,0.827269,0.798574,0.799975,0.798684
250,0.2227,0.521787,0.812631,0.778067,0.782956,0.77999
300,0.2401,0.517873,0.823087,0.805958,0.773472,0.787694
350,0.0854,0.653002,0.82476,0.810655,0.780446,0.792734
400,0.0844,0.698118,0.809285,0.792483,0.782013,0.782279
450,0.1014,0.67652,0.817231,0.797952,0.792443,0.79148
500,0.0445,0.749173,0.826014,0.807352,0.787497,0.793105


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8648,0.659482,0.75115,0.752335,0.668121,0.696826
100,0.5889,0.521688,0.798829,0.798671,0.732698,0.753305
150,0.5421,0.464491,0.820995,0.786643,0.796635,0.789596
200,0.2509,0.496639,0.827269,0.798574,0.799975,0.798684
250,0.2227,0.521787,0.812631,0.778067,0.782956,0.77999
300,0.2401,0.517873,0.823087,0.805958,0.773472,0.787694
350,0.0854,0.653002,0.82476,0.810655,0.780446,0.792734
400,0.0844,0.698118,0.809285,0.792483,0.782013,0.782279
450,0.1014,0.67652,0.817231,0.797952,0.792443,0.79148
500,0.0445,0.749173,0.826014,0.807352,0.787497,0.793105


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8648,0.659482,0.75115,0.752335,0.668121,0.696826
100,0.5889,0.521688,0.798829,0.798671,0.732698,0.753305
150,0.5421,0.464491,0.820995,0.786643,0.796635,0.789596
200,0.2509,0.496639,0.827269,0.798574,0.799975,0.798684
250,0.2227,0.521787,0.812631,0.778067,0.782956,0.77999
300,0.2401,0.517873,0.823087,0.805958,0.773472,0.787694
350,0.0854,0.653002,0.82476,0.810655,0.780446,0.792734
400,0.0844,0.698118,0.809285,0.792483,0.782013,0.782279
450,0.1014,0.67652,0.817231,0.797952,0.792443,0.79148
500,0.0445,0.749173,0.826014,0.807352,0.787497,0.793105


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8818,0.643905,0.74655,0.719131,0.650847,0.674618
100,0.5982,0.54857,0.788791,0.741768,0.774991,0.754983
150,0.5196,0.505547,0.805939,0.781463,0.763744,0.764174
200,0.2481,0.552119,0.809703,0.773997,0.770241,0.770927
250,0.2282,0.554268,0.815558,0.780313,0.779768,0.779723
300,0.2596,0.505192,0.818486,0.793195,0.782768,0.785508
350,0.107,0.687774,0.805939,0.79017,0.773892,0.774161
400,0.1017,0.634205,0.823505,0.793634,0.79014,0.79095
450,0.0956,0.650173,0.814722,0.790096,0.772851,0.778738
500,0.045,0.771458,0.814304,0.781304,0.784766,0.781908


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8818,0.643905,0.74655,0.719131,0.650847,0.674618
100,0.5982,0.54857,0.788791,0.741768,0.774991,0.754983
150,0.5196,0.505547,0.805939,0.781463,0.763744,0.764174
200,0.2481,0.552119,0.809703,0.773997,0.770241,0.770927
250,0.2282,0.554268,0.815558,0.780313,0.779768,0.779723
300,0.2596,0.505192,0.818486,0.793195,0.782768,0.785508
350,0.107,0.687774,0.805939,0.79017,0.773892,0.774161
400,0.1017,0.634205,0.823505,0.793634,0.79014,0.79095
450,0.0956,0.650173,0.814722,0.790096,0.772851,0.778738
500,0.045,0.771458,0.814304,0.781304,0.784766,0.781908


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8818,0.643905,0.74655,0.719131,0.650847,0.674618
100,0.5982,0.54857,0.788791,0.741768,0.774991,0.754983
150,0.5196,0.505547,0.805939,0.781463,0.763744,0.764174
200,0.2481,0.552119,0.809703,0.773997,0.770241,0.770927
250,0.2282,0.554268,0.815558,0.780313,0.779768,0.779723
300,0.2596,0.505192,0.818486,0.793195,0.782768,0.785508
350,0.107,0.687774,0.805939,0.79017,0.773892,0.774161
400,0.1017,0.634205,0.823505,0.793634,0.79014,0.79095
450,0.0956,0.650173,0.814722,0.790096,0.772851,0.778738
500,0.045,0.771458,0.814304,0.781304,0.784766,0.781908


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.983,0.737534,0.706817,0.700057,0.569127,0.564959
100,0.7037,0.562172,0.783772,0.787599,0.703447,0.720358
150,0.5911,0.509679,0.805521,0.765142,0.770667,0.766052
200,0.3148,0.546704,0.813049,0.786523,0.769679,0.777391
250,0.3042,0.547435,0.803011,0.77625,0.770398,0.76824
300,0.3,0.494923,0.82476,0.796154,0.780429,0.786469
350,0.1396,0.598844,0.821832,0.78198,0.802041,0.788753
400,0.1157,0.800121,0.796738,0.784715,0.747846,0.756065
450,0.1529,0.671433,0.814304,0.79138,0.782979,0.777833
500,0.0575,0.842199,0.80803,0.783691,0.768743,0.769479


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.983,0.737534,0.706817,0.700057,0.569127,0.564959
100,0.7037,0.562172,0.783772,0.787599,0.703447,0.720358
150,0.5911,0.509679,0.805521,0.765142,0.770667,0.766052
200,0.3148,0.546704,0.813049,0.786523,0.769679,0.777391
250,0.3042,0.547435,0.803011,0.77625,0.770398,0.76824
300,0.3,0.494923,0.82476,0.796154,0.780429,0.786469
350,0.1396,0.598844,0.821832,0.78198,0.802041,0.788753
400,0.1157,0.800121,0.796738,0.784715,0.747846,0.756065
450,0.1529,0.671433,0.814304,0.79138,0.782979,0.777833
500,0.0575,0.842199,0.80803,0.783691,0.768743,0.769479


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.983,0.737534,0.706817,0.700057,0.569127,0.564959
100,0.7037,0.562172,0.783772,0.787599,0.703447,0.720358
150,0.5911,0.509679,0.805521,0.765142,0.770667,0.766052
200,0.3148,0.546704,0.813049,0.786523,0.769679,0.777391
250,0.3042,0.547435,0.803011,0.77625,0.770398,0.76824
300,0.3,0.494923,0.82476,0.796154,0.780429,0.786469
350,0.1396,0.598844,0.821832,0.78198,0.802041,0.788753
400,0.1157,0.800121,0.796738,0.784715,0.747846,0.756065
450,0.1529,0.671433,0.814304,0.79138,0.782979,0.777833
500,0.0575,0.842199,0.80803,0.783691,0.768743,0.769479


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9757,0.681727,0.745713,0.701766,0.66493,0.676435
100,0.6502,0.536905,0.799665,0.786341,0.752501,0.76646
150,0.5821,0.522581,0.805521,0.812823,0.733932,0.760177
200,0.3124,0.547432,0.803011,0.78418,0.769062,0.768788
250,0.2873,0.503772,0.820577,0.790629,0.798438,0.793471
300,0.2917,0.477807,0.832288,0.816936,0.804065,0.809773
350,0.1029,0.786928,0.80092,0.78997,0.749976,0.763461
400,0.1315,0.677119,0.798411,0.765495,0.770183,0.764402
450,0.102,0.725376,0.809285,0.789938,0.782835,0.783195
500,0.057,0.998043,0.791301,0.801169,0.761906,0.763929


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9757,0.681727,0.745713,0.701766,0.66493,0.676435
100,0.6502,0.536905,0.799665,0.786341,0.752501,0.76646
150,0.5821,0.522581,0.805521,0.812823,0.733932,0.760177
200,0.3124,0.547432,0.803011,0.78418,0.769062,0.768788
250,0.2873,0.503772,0.820577,0.790629,0.798438,0.793471
300,0.2917,0.477807,0.832288,0.816936,0.804065,0.809773
350,0.1029,0.786928,0.80092,0.78997,0.749976,0.763461
400,0.1315,0.677119,0.798411,0.765495,0.770183,0.764402
450,0.102,0.725376,0.809285,0.789938,0.782835,0.783195
500,0.057,0.998043,0.791301,0.801169,0.761906,0.763929


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9757,0.681727,0.745713,0.701766,0.66493,0.676435
100,0.6502,0.536905,0.799665,0.786341,0.752501,0.76646
150,0.5821,0.522581,0.805521,0.812823,0.733932,0.760177
200,0.3124,0.547432,0.803011,0.78418,0.769062,0.768788
250,0.2873,0.503772,0.820577,0.790629,0.798438,0.793471
300,0.2917,0.477807,0.832288,0.816936,0.804065,0.809773
350,0.1029,0.786928,0.80092,0.78997,0.749976,0.763461
400,0.1315,0.677119,0.798411,0.765495,0.770183,0.764402
450,0.102,0.725376,0.809285,0.789938,0.782835,0.783195
500,0.057,0.998043,0.791301,0.801169,0.761906,0.763929


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9816,0.715924,0.721874,0.686408,0.636511,0.645372
100,0.6733,0.588913,0.772898,0.727767,0.72664,0.726438
150,0.6005,0.550834,0.798829,0.779446,0.739078,0.754273
200,0.3351,0.669442,0.780427,0.762347,0.72383,0.728136
250,0.3001,0.565228,0.804266,0.761886,0.789426,0.773851
300,0.357,0.525936,0.81514,0.796483,0.763784,0.777115
350,0.1327,0.718615,0.796738,0.763703,0.763779,0.76224
400,0.151,0.651692,0.803011,0.768233,0.768587,0.764427
450,0.1356,0.700872,0.787955,0.749823,0.788296,0.765486
500,0.0605,0.867833,0.78921,0.75406,0.769961,0.757634


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9816,0.715924,0.721874,0.686408,0.636511,0.645372
100,0.6733,0.588913,0.772898,0.727767,0.72664,0.726438
150,0.6005,0.550834,0.798829,0.779446,0.739078,0.754273
200,0.3351,0.669442,0.780427,0.762347,0.72383,0.728136
250,0.3001,0.565228,0.804266,0.761886,0.789426,0.773851
300,0.357,0.525936,0.81514,0.796483,0.763784,0.777115
350,0.1327,0.718615,0.796738,0.763703,0.763779,0.76224
400,0.151,0.651692,0.803011,0.768233,0.768587,0.764427
450,0.1356,0.700872,0.787955,0.749823,0.788296,0.765486
500,0.0605,0.867833,0.78921,0.75406,0.769961,0.757634


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9816,0.715924,0.721874,0.686408,0.636511,0.645372
100,0.6733,0.588913,0.772898,0.727767,0.72664,0.726438
150,0.6005,0.550834,0.798829,0.779446,0.739078,0.754273
200,0.3351,0.669442,0.780427,0.762347,0.72383,0.728136
250,0.3001,0.565228,0.804266,0.761886,0.789426,0.773851
300,0.357,0.525936,0.81514,0.796483,0.763784,0.777115
350,0.1327,0.718615,0.796738,0.763703,0.763779,0.76224
400,0.151,0.651692,0.803011,0.768233,0.768587,0.764427
450,0.1356,0.700872,0.787955,0.749823,0.788296,0.765486
500,0.0605,0.867833,0.78921,0.75406,0.769961,0.757634


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9996,0.739245,0.712673,0.519637,0.564662,0.532064
100,0.7074,0.552518,0.80092,0.776849,0.750061,0.760743
150,0.5483,0.53362,0.804266,0.793739,0.743171,0.76208
200,0.3396,0.490516,0.822668,0.791135,0.787256,0.78789
250,0.3296,0.505355,0.821414,0.792858,0.796045,0.790727
300,0.3024,0.43068,0.844835,0.829161,0.795393,0.808166
350,0.1483,0.525347,0.832706,0.796092,0.805912,0.795675
400,0.1135,0.511045,0.844417,0.83228,0.798179,0.811754
450,0.1416,0.518098,0.85069,0.819956,0.82376,0.821728
500,0.0758,0.610234,0.841907,0.815791,0.809212,0.809414


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9996,0.739245,0.712673,0.519637,0.564662,0.532064
100,0.7074,0.552518,0.80092,0.776849,0.750061,0.760743
150,0.5483,0.53362,0.804266,0.793739,0.743171,0.76208
200,0.3396,0.490516,0.822668,0.791135,0.787256,0.78789
250,0.3296,0.505355,0.821414,0.792858,0.796045,0.790727
300,0.3024,0.43068,0.844835,0.829161,0.795393,0.808166
350,0.1483,0.525347,0.832706,0.796092,0.805912,0.795675
400,0.1135,0.511045,0.844417,0.83228,0.798179,0.811754
450,0.1416,0.518098,0.85069,0.819956,0.82376,0.821728
500,0.0758,0.610234,0.841907,0.815791,0.809212,0.809414


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9996,0.739245,0.712673,0.519637,0.564662,0.532064
100,0.7074,0.552518,0.80092,0.776849,0.750061,0.760743
150,0.5483,0.53362,0.804266,0.793739,0.743171,0.76208
200,0.3396,0.490516,0.822668,0.791135,0.787256,0.78789
250,0.3296,0.505355,0.821414,0.792858,0.796045,0.790727
300,0.3024,0.43068,0.844835,0.829161,0.795393,0.808166
350,0.1483,0.525347,0.832706,0.796092,0.805912,0.795675
400,0.1135,0.511045,0.844417,0.83228,0.798179,0.811754
450,0.1416,0.518098,0.85069,0.819956,0.82376,0.821728
500,0.0758,0.610234,0.841907,0.815791,0.809212,0.809414


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9754,0.714169,0.722292,0.778738,0.588358,0.553102
100,0.6672,0.541828,0.798829,0.778874,0.741286,0.753255
150,0.5771,0.474886,0.827269,0.801203,0.797476,0.79895
200,0.3373,0.483383,0.833961,0.825114,0.795255,0.806268
250,0.2857,0.487248,0.837307,0.81328,0.804726,0.808864
300,0.3194,0.473382,0.835634,0.811659,0.813595,0.811755
350,0.1223,0.553311,0.838143,0.811399,0.815757,0.812756
400,0.1307,0.548203,0.833961,0.7962,0.825794,0.808537
450,0.134,0.658767,0.807612,0.779577,0.794615,0.780271
500,0.0586,0.659289,0.84358,0.821604,0.805812,0.813101


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9754,0.714169,0.722292,0.778738,0.588358,0.553102
100,0.6672,0.541828,0.798829,0.778874,0.741286,0.753255
150,0.5771,0.474886,0.827269,0.801203,0.797476,0.79895
200,0.3373,0.483383,0.833961,0.825114,0.795255,0.806268
250,0.2857,0.487248,0.837307,0.81328,0.804726,0.808864
300,0.3194,0.473382,0.835634,0.811659,0.813595,0.811755
350,0.1223,0.553311,0.838143,0.811399,0.815757,0.812756
400,0.1307,0.548203,0.833961,0.7962,0.825794,0.808537
450,0.134,0.658767,0.807612,0.779577,0.794615,0.780271
500,0.0586,0.659289,0.84358,0.821604,0.805812,0.813101


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.9754,0.714169,0.722292,0.778738,0.588358,0.553102
100,0.6672,0.541828,0.798829,0.778874,0.741286,0.753255
150,0.5771,0.474886,0.827269,0.801203,0.797476,0.79895
200,0.3373,0.483383,0.833961,0.825114,0.795255,0.806268
250,0.2857,0.487248,0.837307,0.81328,0.804726,0.808864
300,0.3194,0.473382,0.835634,0.811659,0.813595,0.811755
350,0.1223,0.553311,0.838143,0.811399,0.815757,0.812756
400,0.1307,0.548203,0.833961,0.7962,0.825794,0.808537
450,0.134,0.658767,0.807612,0.779577,0.794615,0.780271
500,0.0586,0.659289,0.84358,0.821604,0.805812,0.813101


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0053,0.764842,0.706399,0.765884,0.545418,0.52762
100,0.7019,0.638835,0.759097,0.719226,0.739944,0.722388
150,0.5379,0.512114,0.809703,0.767539,0.778211,0.767524
200,0.3421,0.498351,0.82936,0.786994,0.806326,0.794157
250,0.2996,0.490934,0.823923,0.784036,0.787635,0.783758
300,0.3301,0.480832,0.830615,0.794902,0.801565,0.798109
350,0.1346,0.572862,0.823923,0.799163,0.785897,0.788695
400,0.1436,0.612724,0.814722,0.781231,0.78568,0.775694
450,0.1364,0.565213,0.833124,0.807711,0.795957,0.801305
500,0.0616,0.683143,0.826432,0.790839,0.802324,0.794201


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0053,0.764842,0.706399,0.765884,0.545418,0.52762
100,0.7019,0.638835,0.759097,0.719226,0.739944,0.722388
150,0.5379,0.512114,0.809703,0.767539,0.778211,0.767524
200,0.3421,0.498351,0.82936,0.786994,0.806326,0.794157
250,0.2996,0.490934,0.823923,0.784036,0.787635,0.783758
300,0.3301,0.480832,0.830615,0.794902,0.801565,0.798109
350,0.1346,0.572862,0.823923,0.799163,0.785897,0.788695
400,0.1436,0.612724,0.814722,0.781231,0.78568,0.775694
450,0.1364,0.565213,0.833124,0.807711,0.795957,0.801305
500,0.0616,0.683143,0.826432,0.790839,0.802324,0.794201


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0053,0.764842,0.706399,0.765884,0.545418,0.52762
100,0.7019,0.638835,0.759097,0.719226,0.739944,0.722388
150,0.5379,0.512114,0.809703,0.767539,0.778211,0.767524
200,0.3421,0.498351,0.82936,0.786994,0.806326,0.794157
250,0.2996,0.490934,0.823923,0.784036,0.787635,0.783758
300,0.3301,0.480832,0.830615,0.794902,0.801565,0.798109
350,0.1346,0.572862,0.823923,0.799163,0.785897,0.788695
400,0.1436,0.612724,0.814722,0.781231,0.78568,0.775694
450,0.1364,0.565213,0.833124,0.807711,0.795957,0.801305
500,0.0616,0.683143,0.826432,0.790839,0.802324,0.794201


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7118,0.51375,0.80803,0.75485,0.801127,0.770387
100,0.453,0.335431,0.869092,0.871497,0.821601,0.842795
150,0.3418,0.282042,0.894605,0.882715,0.876278,0.878172
200,0.1396,0.357074,0.879548,0.867397,0.852201,0.858392
250,0.1686,0.347948,0.879548,0.880279,0.854793,0.861269
300,0.1543,0.294229,0.903806,0.903133,0.887316,0.894248
350,0.0503,0.328232,0.900042,0.88855,0.884925,0.885428
400,0.0507,0.390969,0.891677,0.87968,0.8856,0.880809
450,0.0647,0.368448,0.898369,0.874611,0.889449,0.881226
500,0.0286,0.421835,0.906315,0.898182,0.877905,0.886354


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7118,0.51375,0.80803,0.75485,0.801127,0.770387
100,0.453,0.335431,0.869092,0.871497,0.821601,0.842795
150,0.3418,0.282042,0.894605,0.882715,0.876278,0.878172
200,0.1396,0.357074,0.879548,0.867397,0.852201,0.858392
250,0.1686,0.347948,0.879548,0.880279,0.854793,0.861269
300,0.1543,0.294229,0.903806,0.903133,0.887316,0.894248
350,0.0503,0.328232,0.900042,0.88855,0.884925,0.885428
400,0.0507,0.390969,0.891677,0.87968,0.8856,0.880809
450,0.0647,0.368448,0.898369,0.874611,0.889449,0.881226
500,0.0286,0.421835,0.906315,0.898182,0.877905,0.886354


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7118,0.51375,0.80803,0.75485,0.801127,0.770387
100,0.453,0.335431,0.869092,0.871497,0.821601,0.842795
150,0.3418,0.282042,0.894605,0.882715,0.876278,0.878172
200,0.1396,0.357074,0.879548,0.867397,0.852201,0.858392
250,0.1686,0.347948,0.879548,0.880279,0.854793,0.861269
300,0.1543,0.294229,0.903806,0.903133,0.887316,0.894248
350,0.0503,0.328232,0.900042,0.88855,0.884925,0.885428
400,0.0507,0.390969,0.891677,0.87968,0.8856,0.880809
450,0.0647,0.368448,0.898369,0.874611,0.889449,0.881226
500,0.0286,0.421835,0.906315,0.898182,0.877905,0.886354


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7227,0.435023,0.838143,0.823199,0.790797,0.804587
100,0.3967,0.341074,0.875784,0.880698,0.820371,0.843257
150,0.3376,0.332542,0.877875,0.857871,0.861428,0.85382
200,0.1562,0.292357,0.900878,0.875121,0.896483,0.884529
250,0.155,0.295127,0.898369,0.886396,0.879652,0.881932
300,0.1421,0.379306,0.87913,0.874275,0.854888,0.85787
350,0.0689,0.330839,0.898787,0.883518,0.885839,0.88415
400,0.0599,0.35393,0.901297,0.896114,0.8736,0.882701
450,0.065,0.434654,0.88624,0.871608,0.86379,0.865133
500,0.0464,0.427949,0.896696,0.878253,0.873624,0.875734


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7227,0.435023,0.838143,0.823199,0.790797,0.804587
100,0.3967,0.341074,0.875784,0.880698,0.820371,0.843257
150,0.3376,0.332542,0.877875,0.857871,0.861428,0.85382
200,0.1562,0.292357,0.900878,0.875121,0.896483,0.884529
250,0.155,0.295127,0.898369,0.886396,0.879652,0.881932
300,0.1421,0.379306,0.87913,0.874275,0.854888,0.85787
350,0.0689,0.330839,0.898787,0.883518,0.885839,0.88415
400,0.0599,0.35393,0.901297,0.896114,0.8736,0.882701
450,0.065,0.434654,0.88624,0.871608,0.86379,0.865133
500,0.0464,0.427949,0.896696,0.878253,0.873624,0.875734


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7227,0.435023,0.838143,0.823199,0.790797,0.804587
100,0.3967,0.341074,0.875784,0.880698,0.820371,0.843257
150,0.3376,0.332542,0.877875,0.857871,0.861428,0.85382
200,0.1562,0.292357,0.900878,0.875121,0.896483,0.884529
250,0.155,0.295127,0.898369,0.886396,0.879652,0.881932
300,0.1421,0.379306,0.87913,0.874275,0.854888,0.85787
350,0.0689,0.330839,0.898787,0.883518,0.885839,0.88415
400,0.0599,0.35393,0.901297,0.896114,0.8736,0.882701
450,0.065,0.434654,0.88624,0.871608,0.86379,0.865133
500,0.0464,0.427949,0.896696,0.878253,0.873624,0.875734


faisalq/SaudiBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7454,0.430932,0.840234,0.80747,0.800872,0.803301
100,0.3971,0.362172,0.860309,0.815403,0.856962,0.831024
150,0.3251,0.313531,0.871602,0.842838,0.853107,0.839333
200,0.1214,0.351263,0.882476,0.876512,0.833807,0.852165
250,0.1412,0.371449,0.876202,0.873886,0.826025,0.844268
300,0.1365,0.364087,0.878294,0.85359,0.86052,0.854035
350,0.0603,0.380885,0.892514,0.863117,0.872507,0.867068
400,0.0567,0.423859,0.883312,0.854762,0.862581,0.857374
450,0.065,0.351064,0.895859,0.872676,0.877137,0.874828
500,0.0433,0.418005,0.887913,0.860525,0.876394,0.868052


faisalq/SaudiBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7454,0.430932,0.840234,0.80747,0.800872,0.803301
100,0.3971,0.362172,0.860309,0.815403,0.856962,0.831024
150,0.3251,0.313531,0.871602,0.842838,0.853107,0.839333
200,0.1214,0.351263,0.882476,0.876512,0.833807,0.852165
250,0.1412,0.371449,0.876202,0.873886,0.826025,0.844268
300,0.1365,0.364087,0.878294,0.85359,0.86052,0.854035
350,0.0603,0.380885,0.892514,0.863117,0.872507,0.867068
400,0.0567,0.423859,0.883312,0.854762,0.862581,0.857374
450,0.065,0.351064,0.895859,0.872676,0.877137,0.874828
500,0.0433,0.418005,0.887913,0.860525,0.876394,0.868052


faisalq/SaudiBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7454,0.430932,0.840234,0.80747,0.800872,0.803301
100,0.3971,0.362172,0.860309,0.815403,0.856962,0.831024
150,0.3251,0.313531,0.871602,0.842838,0.853107,0.839333
200,0.1214,0.351263,0.882476,0.876512,0.833807,0.852165
250,0.1412,0.371449,0.876202,0.873886,0.826025,0.844268
300,0.1365,0.364087,0.878294,0.85359,0.86052,0.854035
350,0.0603,0.380885,0.892514,0.863117,0.872507,0.867068
400,0.0567,0.423859,0.883312,0.854762,0.862581,0.857374
450,0.065,0.351064,0.895859,0.872676,0.877137,0.874828
500,0.0433,0.418005,0.887913,0.860525,0.876394,0.868052


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

SaudiBERT_LSTM, try:0


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0752,0.817577,0.766625,0.554128,0.615073,0.582732
100,0.7443,0.569803,0.860309,0.82806,0.821055,0.822646
150,0.54,0.44737,0.879548,0.877333,0.823497,0.842132
200,0.3763,0.403831,0.876621,0.864461,0.849861,0.853661
250,0.3027,0.402061,0.874529,0.869328,0.835853,0.845569
300,0.2587,0.359941,0.877039,0.849316,0.858736,0.847161
350,0.169,0.3472,0.891259,0.867165,0.872743,0.869732
400,0.1259,0.35035,0.889586,0.866034,0.871078,0.867111
450,0.1384,0.386752,0.879967,0.865131,0.846154,0.850998
500,0.0965,0.346745,0.90046,0.869998,0.883611,0.875339


SaudiBERT_LSTM, try:1


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0752,0.817577,0.766625,0.554128,0.615073,0.582732
100,0.7443,0.569803,0.860309,0.82806,0.821055,0.822646
150,0.54,0.44737,0.879548,0.877333,0.823497,0.842132
200,0.3763,0.403831,0.876621,0.864461,0.849861,0.853661
250,0.3027,0.402061,0.874529,0.869328,0.835853,0.845569
300,0.2587,0.359941,0.877039,0.849316,0.858736,0.847161
350,0.169,0.3472,0.891259,0.867165,0.872743,0.869732
400,0.1259,0.35035,0.889586,0.866034,0.871078,0.867111
450,0.1384,0.386752,0.879967,0.865131,0.846154,0.850998
500,0.0965,0.346745,0.90046,0.869998,0.883611,0.875339


SaudiBERT_LSTM, try:2


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0752,0.817577,0.766625,0.554128,0.615073,0.582732
100,0.7443,0.569803,0.860309,0.82806,0.821055,0.822646
150,0.54,0.44737,0.879548,0.877333,0.823497,0.842132
200,0.3763,0.403831,0.876621,0.864461,0.849861,0.853661
250,0.3027,0.402061,0.874529,0.869328,0.835853,0.845569
300,0.2587,0.359941,0.877039,0.849316,0.858736,0.847161
350,0.169,0.3472,0.891259,0.867165,0.872743,0.869732
400,0.1259,0.35035,0.889586,0.866034,0.871078,0.867111
450,0.1384,0.386752,0.879967,0.865131,0.846154,0.850998
500,0.0965,0.346745,0.90046,0.869998,0.883611,0.875339


SaudiBERT_LSTM, try:0


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0605,0.831131,0.749895,0.545355,0.598736,0.570317
100,0.7138,0.586532,0.823087,0.832657,0.71577,0.727785
150,0.5497,0.478411,0.86491,0.843896,0.841057,0.838912
200,0.3599,0.381993,0.884985,0.859395,0.852885,0.854889
250,0.2857,0.413809,0.854036,0.819327,0.86196,0.825077
300,0.3115,0.366775,0.871602,0.840384,0.873319,0.852039
350,0.1577,0.358026,0.890422,0.871341,0.866589,0.867674
400,0.1575,0.341926,0.897951,0.896152,0.862544,0.876379
450,0.1567,0.352341,0.883312,0.854757,0.873335,0.860951
500,0.0808,0.371724,0.897951,0.88241,0.874326,0.877476


SaudiBERT_LSTM, try:1


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0605,0.831131,0.749895,0.545355,0.598736,0.570317
100,0.7138,0.586532,0.823087,0.832657,0.71577,0.727785
150,0.5497,0.478411,0.86491,0.843896,0.841057,0.838912
200,0.3599,0.381993,0.884985,0.859395,0.852885,0.854889
250,0.2857,0.413809,0.854036,0.819327,0.86196,0.825077
300,0.3115,0.366775,0.871602,0.840384,0.873319,0.852039
350,0.1577,0.358026,0.890422,0.871341,0.866589,0.867674
400,0.1575,0.341926,0.897951,0.896152,0.862544,0.876379
450,0.1567,0.352341,0.883312,0.854757,0.873335,0.860951
500,0.0808,0.371724,0.897951,0.88241,0.874326,0.877476


SaudiBERT_LSTM, try:2


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.0605,0.831131,0.749895,0.545355,0.598736,0.570317
100,0.7138,0.586532,0.823087,0.832657,0.71577,0.727785
150,0.5497,0.478411,0.86491,0.843896,0.841057,0.838912
200,0.3599,0.381993,0.884985,0.859395,0.852885,0.854889
250,0.2857,0.413809,0.854036,0.819327,0.86196,0.825077
300,0.3115,0.366775,0.871602,0.840384,0.873319,0.852039
350,0.1577,0.358026,0.890422,0.871341,0.866589,0.867674
400,0.1575,0.341926,0.897951,0.896152,0.862544,0.876379
450,0.1567,0.352341,0.883312,0.854757,0.873335,0.860951
500,0.0808,0.371724,0.897951,0.88241,0.874326,0.877476


SaudiBERT_LSTM, try:0


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.09,0.860591,0.73944,0.532566,0.603338,0.562028
100,0.7211,0.5927,0.83647,0.797405,0.78395,0.784993
150,0.5343,0.46936,0.87202,0.842976,0.850744,0.846255
200,0.3479,0.406709,0.874529,0.84122,0.85886,0.845986
250,0.2802,0.379412,0.880385,0.848262,0.862568,0.854097
300,0.2818,0.391628,0.869929,0.856261,0.846351,0.845446
350,0.1577,0.385546,0.873275,0.846641,0.867975,0.854094
400,0.1575,0.354306,0.894605,0.869289,0.879169,0.873664
450,0.1426,0.376421,0.876621,0.838798,0.871608,0.849933
500,0.0956,0.420168,0.879548,0.838379,0.87615,0.852441


SaudiBERT_LSTM, try:1


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.09,0.860591,0.73944,0.532566,0.603338,0.562028
100,0.7211,0.5927,0.83647,0.797405,0.78395,0.784993
150,0.5343,0.46936,0.87202,0.842976,0.850744,0.846255
200,0.3479,0.406709,0.874529,0.84122,0.85886,0.845986
250,0.2802,0.379412,0.880385,0.848262,0.862568,0.854097
300,0.2818,0.391628,0.869929,0.856261,0.846351,0.845446
350,0.1577,0.385546,0.873275,0.846641,0.867975,0.854094
400,0.1575,0.354306,0.894605,0.869289,0.879169,0.873664
450,0.1426,0.376421,0.876621,0.838798,0.871608,0.849933
500,0.0956,0.420168,0.879548,0.838379,0.87615,0.852441


SaudiBERT_LSTM, try:2


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,1.09,0.860591,0.73944,0.532566,0.603338,0.562028
100,0.7211,0.5927,0.83647,0.797405,0.78395,0.784993
150,0.5343,0.46936,0.87202,0.842976,0.850744,0.846255
200,0.3479,0.406709,0.874529,0.84122,0.85886,0.845986
250,0.2802,0.379412,0.880385,0.848262,0.862568,0.854097
300,0.2818,0.391628,0.869929,0.856261,0.846351,0.845446
350,0.1577,0.385546,0.873275,0.846641,0.867975,0.854094
400,0.1575,0.354306,0.894605,0.869289,0.879169,0.873664
450,0.1426,0.376421,0.876621,0.838798,0.871608,0.849933
500,0.0956,0.420168,0.879548,0.838379,0.87615,0.852441


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 9562
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 2391
    })
})

SaudiBERT_CNN, try:0


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7135,0.493357,0.813467,0.764164,0.789159,0.772815
100,0.4372,0.336813,0.871184,0.878192,0.820534,0.842578
150,0.3313,0.293908,0.889168,0.880231,0.867363,0.871621
200,0.1604,0.293962,0.89335,0.888685,0.865338,0.875797
250,0.1457,0.284908,0.906734,0.902879,0.87948,0.887994
300,0.1521,0.274708,0.895441,0.889019,0.864559,0.875894
350,0.0612,0.375172,0.881221,0.847686,0.887863,0.863688
400,0.0531,0.392739,0.887913,0.870968,0.881553,0.87423
450,0.0659,0.400265,0.894187,0.889874,0.868861,0.876252
500,0.0371,0.377461,0.899624,0.885616,0.873744,0.879378


SaudiBERT_CNN, try:1


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7205,0.474283,0.820159,0.771442,0.789333,0.777601
100,0.4364,0.358438,0.86491,0.871931,0.800976,0.827606
150,0.3367,0.285975,0.890004,0.876366,0.868387,0.871126
200,0.1463,0.32271,0.883312,0.87979,0.852749,0.863707
250,0.1461,0.291601,0.897951,0.900308,0.853872,0.869074
300,0.1463,0.291949,0.894187,0.889375,0.861861,0.873464
350,0.0554,0.406943,0.879967,0.85193,0.873154,0.855192
400,0.056,0.36169,0.899624,0.876176,0.887974,0.881184
450,0.0676,0.348609,0.900878,0.881484,0.884623,0.882122
500,0.0398,0.418129,0.887913,0.877869,0.863544,0.867118


SaudiBERT_CNN, try:2


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7225,0.462748,0.823087,0.774929,0.790848,0.780748
100,0.4368,0.366902,0.860309,0.872163,0.795786,0.82412
150,0.3375,0.290796,0.889586,0.876473,0.868108,0.871015
200,0.1479,0.338069,0.877875,0.878803,0.847728,0.860697
250,0.143,0.31141,0.890841,0.881569,0.870031,0.872667
300,0.1512,0.298898,0.892095,0.882156,0.872584,0.873966
350,0.055,0.341375,0.901715,0.877833,0.889501,0.881723
400,0.0456,0.44307,0.891677,0.879305,0.876968,0.873469
450,0.0663,0.345059,0.900878,0.873461,0.894763,0.882916
500,0.0414,0.347389,0.906315,0.889084,0.891592,0.889647


SaudiBERT_CNN, try:0


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.8291,0.575925,0.795065,0.747568,0.780483,0.760387
100,0.472,0.34759,0.875784,0.858967,0.845543,0.850821
150,0.3589,0.317515,0.886658,0.868768,0.86237,0.864898
200,0.1828,0.357,0.868674,0.836901,0.866109,0.84763
250,0.2026,0.291084,0.888749,0.862633,0.877511,0.869269
300,0.1877,0.278785,0.887495,0.874953,0.860704,0.866731
350,0.07,0.329377,0.889586,0.875628,0.868917,0.871606
400,0.0917,0.354954,0.889168,0.881852,0.853639,0.863719
450,0.0714,0.354952,0.895023,0.874855,0.884903,0.879334
500,0.0385,0.427344,0.887495,0.883474,0.844855,0.855575


SaudiBERT_CNN, try:1


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7234,0.458695,0.821414,0.794189,0.771726,0.781209
100,0.4084,0.294385,0.883731,0.863043,0.861768,0.862379
150,0.3103,0.276996,0.884567,0.87491,0.856417,0.86392
200,0.1633,0.263724,0.901297,0.881503,0.891436,0.885161
250,0.1474,0.312469,0.889168,0.867847,0.878249,0.870196
300,0.1465,0.297357,0.890004,0.89524,0.843105,0.859266
350,0.0523,0.349133,0.897114,0.889394,0.866864,0.875345
400,0.0648,0.368524,0.891259,0.884463,0.870171,0.874702
450,0.0722,0.397715,0.887913,0.867619,0.872432,0.869188
500,0.0403,0.433035,0.883312,0.874239,0.861242,0.863909


SaudiBERT_CNN, try:2


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7214,0.484324,0.81514,0.79344,0.760755,0.771978
100,0.4189,0.319481,0.877457,0.874894,0.832298,0.849412
150,0.3225,0.289629,0.879548,0.866444,0.857827,0.860725
200,0.1593,0.271873,0.899205,0.879617,0.883811,0.879594
250,0.1468,0.292652,0.892095,0.868967,0.884857,0.875486
300,0.1328,0.293998,0.887495,0.879123,0.86792,0.870158
350,0.0578,0.334297,0.892932,0.875425,0.874525,0.874215
400,0.0658,0.322524,0.900878,0.886028,0.881677,0.88339
450,0.0683,0.379409,0.881639,0.853807,0.880253,0.864566
500,0.0331,0.369324,0.898787,0.885948,0.88204,0.883007


SaudiBERT_CNN, try:0


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7555,0.443613,0.839816,0.795715,0.807479,0.798885
100,0.3988,0.341716,0.874529,0.837997,0.861511,0.847528
150,0.3313,0.285153,0.892932,0.863566,0.875522,0.869236
200,0.1361,0.312957,0.881639,0.863698,0.858628,0.859053
250,0.1457,0.322617,0.889586,0.870377,0.871073,0.868777
300,0.13,0.298767,0.897532,0.870466,0.883957,0.876424
350,0.0541,0.500075,0.864492,0.839255,0.854938,0.842204
400,0.0656,0.345412,0.897532,0.874532,0.879164,0.876031
450,0.0781,0.385863,0.883312,0.84134,0.87914,0.857282
500,0.0372,0.346119,0.899205,0.867109,0.892848,0.878208


SaudiBERT_CNN, try:1


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7477,0.434191,0.836052,0.80197,0.79729,0.794781
100,0.3934,0.322752,0.880385,0.850971,0.861242,0.85488
150,0.3216,0.279699,0.894187,0.874082,0.870107,0.870807
200,0.1212,0.336882,0.878294,0.866019,0.845778,0.853299
250,0.1497,0.323943,0.888749,0.87651,0.858072,0.863339
300,0.1382,0.327958,0.884985,0.865834,0.875178,0.867113
350,0.0621,0.347507,0.897532,0.885741,0.87468,0.87795
400,0.06,0.377728,0.88624,0.873561,0.870047,0.867367
450,0.0745,0.430655,0.874111,0.833847,0.871433,0.848897
500,0.0378,0.356806,0.897951,0.866139,0.894946,0.878333


SaudiBERT_CNN, try:2


Some weights of BertModel were not initialized from the model checkpoint at faisalq/SaudiBERT and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/9562 [00:00<?, ? examples/s]

Map:   0%|          | 0/2391 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1 Score
50,0.7491,0.440077,0.831451,0.797236,0.792181,0.789229
100,0.4037,0.335978,0.877457,0.846409,0.858341,0.850309
150,0.318,0.274356,0.893768,0.873017,0.868828,0.869925
200,0.1259,0.32691,0.881221,0.862019,0.858751,0.858959
250,0.1417,0.284191,0.897532,0.873393,0.874856,0.873914
300,0.129,0.322272,0.881221,0.855736,0.869342,0.860898
350,0.0592,0.368336,0.893768,0.884821,0.862194,0.869488
400,0.0623,0.392141,0.886658,0.87703,0.851395,0.860859
450,0.0646,0.421031,0.878712,0.843239,0.868641,0.853496
500,0.0435,0.392191,0.891259,0.86692,0.875999,0.870396


Unnamed: 0,Model,Accuracy,Precision,Recall,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.795901,0.760071,0.762201,0.760424
3,SaudiBERT_CNN,0.919699,0.911292,0.897105,0.903856
4,SaudiBERT_LSTM,0.91468,0.899867,0.904016,0.901896
7,UBC-NLP/MARBERT,0.832288,0.816936,0.804065,0.809773
10,UBC-NLP/MARBERTv2,0.847344,0.829816,0.821659,0.825433
13,aubmindlab/bert-base-arabertv02-twitter,0.848181,0.821111,0.818306,0.819407
15,faisalq/SaudiBERT,0.916771,0.909514,0.896095,0.902327
18,qarib/bert-base-qarib,0.840234,0.813145,0.814997,0.814038
