In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="0" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'MSAC_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')



dataset = load_dataset('AbderrahmanSkiredj1/MSAC_darija_sentiment_analysis')
df = pd.DataFrame(dataset['train']) 

      
display(df.columns)
display(len(df))
display(df[:4])

df['label'] = df['label'].replace(',ne', 'neg')

classes = set(df['label'].values)
display(classes)

c = df['label'].value_counts()
display(c)

df['label'] = df['label'].astype('category')
df['label'] = df['label'].cat.codes

df = df[['text', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))


# ds = Dataset.from_pandas(df)
# ds = ds.train_test_split(test_size=0.2)

# display(ds)

max_sequence_length = 128


models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
]





seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
    
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['text'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True) # , batched=True
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)  # , batched=True
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 25
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 20, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 20
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-17 04:54:18.916753: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-17 04:54:18.939674: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.
Found cached dataset parquet (/home/ffq/.cache/huggingface/datasets/AbderrahmanSkiredj1___parquet/AbderrahmanSkiredj1--MSAC_darija_sentiment_analysis-78ec287cfc3da3ad/0.0.0/14a00e99c0d15a23649d0db8944380ac81082d4b021f398733dd84f3a6c569a7)


  0%|          | 0/1 [00:00<?, ?it/s]

Index(['text', 'label'], dtype='object')

2000

Unnamed: 0,text,label
0,'طوال حياتي لم المس اي تغير حتى قدمت هذه الحكومة فل نقف بجانها بصوتنا',pos
1,'منتوج رائع وثمن مناسب ....جميل',pos
2,'كلنا ابن كيران لمتافق معايا يدير جيم',pos
3,'وفقك الله لولاية اخرى حقاش مكينش محسن منك',pos


{'neg', 'pos'}

label
pos    1000
neg    1000
Name: count, dtype: int64

2

2000

DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 1600
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 400
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3304,0.286844,0.9,0.899183
40,0.1588,0.247279,0.9025,0.902118
60,0.0827,0.275547,0.9125,0.911571
80,0.031,0.301574,0.925,0.924576
100,0.0163,0.362803,0.925,0.924729
120,0.0117,0.383156,0.9225,0.922286
140,0.0078,0.393745,0.9175,0.916624
160,0.0106,0.359181,0.925,0.924317
180,0.012,0.3685,0.9225,0.922145
200,0.0012,0.386448,0.92,0.919606


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3816,0.287244,0.9075,0.906702
40,0.1623,0.242887,0.9075,0.906941
60,0.0908,0.293726,0.915,0.914742
80,0.0385,0.401522,0.9075,0.907193
100,0.025,0.370439,0.9025,0.901832
120,0.0097,0.400138,0.915,0.914581
140,0.0109,0.424739,0.9125,0.911825
160,0.0079,0.447293,0.91,0.909675
180,0.0074,0.462536,0.9125,0.911825
200,0.0009,0.49359,0.9125,0.912038


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3816,0.287244,0.9075,0.906702
40,0.1623,0.242887,0.9075,0.906941
60,0.0908,0.293726,0.915,0.914742
80,0.0385,0.401522,0.9075,0.907193
100,0.025,0.370439,0.9025,0.901832
120,0.0097,0.400138,0.915,0.914581
140,0.0109,0.424739,0.9125,0.911825
160,0.0079,0.447293,0.91,0.909675
180,0.0074,0.462536,0.9125,0.911825
200,0.0009,0.49359,0.9125,0.912038


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.401,0.259751,0.91,0.908898
40,0.1371,0.252194,0.935,0.934581
60,0.0957,0.23365,0.935,0.934581
80,0.0326,0.310276,0.9225,0.922145
100,0.0123,0.326713,0.9275,0.926941
120,0.0017,0.38783,0.9275,0.9273
140,0.0116,0.474908,0.9225,0.921594
160,0.0006,0.399772,0.92,0.919661
180,0.0011,0.478574,0.925,0.924388
200,0.0013,0.535372,0.91,0.90989


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.401,0.259751,0.91,0.908898
40,0.1371,0.252194,0.935,0.934581
60,0.0957,0.23365,0.935,0.934581
80,0.0326,0.310276,0.9225,0.922145
100,0.0123,0.326713,0.9275,0.926941
120,0.0017,0.38783,0.9275,0.9273
140,0.0116,0.474908,0.9225,0.921594
160,0.0006,0.399772,0.92,0.919661
180,0.0011,0.478574,0.925,0.924388
200,0.0013,0.535372,0.91,0.90989


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.401,0.259751,0.91,0.908898
40,0.1371,0.252194,0.935,0.934581
60,0.0957,0.23365,0.935,0.934581
80,0.0326,0.310276,0.9225,0.922145
100,0.0123,0.326713,0.9275,0.926941
120,0.0017,0.38783,0.9275,0.9273
140,0.0116,0.474908,0.9225,0.921594
160,0.0006,0.399772,0.92,0.919661
180,0.0011,0.478574,0.925,0.924388
200,0.0013,0.535372,0.91,0.90989


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4038,0.241687,0.92,0.919418
40,0.1853,0.195937,0.9325,0.932092
60,0.0887,0.223949,0.9225,0.922461
80,0.0551,0.257207,0.9275,0.927478
100,0.0276,0.272109,0.9325,0.932347
120,0.0119,0.301962,0.94,0.939661
140,0.0135,0.403823,0.935,0.934985
160,0.0077,0.354402,0.9375,0.937412
180,0.003,0.322872,0.94,0.939878
200,0.0047,0.342716,0.94,0.939878


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4038,0.241687,0.92,0.919418
40,0.1853,0.195937,0.9325,0.932092
60,0.0887,0.223949,0.9225,0.922461
80,0.0551,0.257207,0.9275,0.927478
100,0.0276,0.272109,0.9325,0.932347
120,0.0119,0.301962,0.94,0.939661
140,0.0135,0.403823,0.935,0.934985
160,0.0077,0.354402,0.9375,0.937412
180,0.003,0.322872,0.94,0.939878
200,0.0047,0.342716,0.94,0.939878


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4038,0.241687,0.92,0.919418
40,0.1853,0.195937,0.9325,0.932092
60,0.0887,0.223949,0.9225,0.922461
80,0.0551,0.257207,0.9275,0.927478
100,0.0276,0.272109,0.9325,0.932347
120,0.0119,0.301962,0.94,0.939661
140,0.0135,0.403823,0.935,0.934985
160,0.0077,0.354402,0.9375,0.937412
180,0.003,0.322872,0.94,0.939878
200,0.0047,0.342716,0.94,0.939878


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 1600
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 400
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4333,0.323037,0.8775,0.875139
40,0.2222,0.336453,0.8975,0.896958
60,0.1536,0.337248,0.905,0.903727
80,0.0821,0.411854,0.885,0.883591
100,0.0575,0.465536,0.87,0.869736
120,0.0165,0.552018,0.8875,0.886729
140,0.0247,0.656902,0.89,0.888109
160,0.0154,0.62737,0.885,0.883591
180,0.0063,0.747533,0.8575,0.857242
200,0.0049,0.746329,0.8925,0.890995


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4333,0.323037,0.8775,0.875139
40,0.2222,0.336453,0.8975,0.896958
60,0.1536,0.337248,0.905,0.903727
80,0.0821,0.411854,0.885,0.883591
100,0.0575,0.465536,0.87,0.869736
120,0.0165,0.552018,0.8875,0.886729
140,0.0247,0.656902,0.89,0.888109
160,0.0154,0.62737,0.885,0.883591
180,0.0063,0.747533,0.8575,0.857242
200,0.0049,0.746329,0.8925,0.890995


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4333,0.323037,0.8775,0.875139
40,0.2222,0.336453,0.8975,0.896958
60,0.1536,0.337248,0.905,0.903727
80,0.0821,0.411854,0.885,0.883591
100,0.0575,0.465536,0.87,0.869736
120,0.0165,0.552018,0.8875,0.886729
140,0.0247,0.656902,0.89,0.888109
160,0.0154,0.62737,0.885,0.883591
180,0.0063,0.747533,0.8575,0.857242
200,0.0049,0.746329,0.8925,0.890995


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4993,0.349364,0.8625,0.859226
40,0.2299,0.322718,0.88,0.88
60,0.1531,0.332694,0.8875,0.887342
80,0.0804,0.372534,0.895,0.894989
100,0.0479,0.400789,0.9,0.89899
120,0.0162,0.532986,0.9025,0.901832
140,0.0018,0.742338,0.87,0.869971
160,0.0073,0.622347,0.9,0.899356
180,0.0006,0.650481,0.895,0.894236
200,0.0003,0.674286,0.895,0.894554


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4993,0.349364,0.8625,0.859226
40,0.2299,0.322718,0.88,0.88
60,0.1531,0.332694,0.8875,0.887342
80,0.0804,0.372534,0.895,0.894989
100,0.0479,0.400789,0.9,0.89899
120,0.0162,0.532986,0.9025,0.901832
140,0.0018,0.742338,0.87,0.869971
160,0.0073,0.622347,0.9,0.899356
180,0.0006,0.650481,0.895,0.894236
200,0.0003,0.674286,0.895,0.894554


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4993,0.349364,0.8625,0.859226
40,0.2299,0.322718,0.88,0.88
60,0.1531,0.332694,0.8875,0.887342
80,0.0804,0.372534,0.895,0.894989
100,0.0479,0.400789,0.9,0.89899
120,0.0162,0.532986,0.9025,0.901832
140,0.0018,0.742338,0.87,0.869971
160,0.0073,0.622347,0.9,0.899356
180,0.0006,0.650481,0.895,0.894236
200,0.0003,0.674286,0.895,0.894554


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4636,0.283265,0.8975,0.896412
40,0.2296,0.212772,0.9225,0.922196
60,0.1207,0.327897,0.9075,0.907486
80,0.0673,0.296734,0.9125,0.912456
100,0.048,0.334904,0.9275,0.927168
120,0.0274,0.374092,0.92,0.919838
140,0.0173,0.427769,0.9275,0.927168
160,0.0318,0.344557,0.9175,0.917064
180,0.0047,0.363004,0.9375,0.937359
200,0.0062,0.434106,0.9275,0.927445


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4636,0.283265,0.8975,0.896412
40,0.2296,0.212772,0.9225,0.922196
60,0.1207,0.327897,0.9075,0.907486
80,0.0673,0.296734,0.9125,0.912456
100,0.048,0.334904,0.9275,0.927168
120,0.0274,0.374092,0.92,0.919838
140,0.0173,0.427769,0.9275,0.927168
160,0.0318,0.344557,0.9175,0.917064
180,0.0047,0.363004,0.9375,0.937359
200,0.0062,0.434106,0.9275,0.927445


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4636,0.283265,0.8975,0.896412
40,0.2296,0.212772,0.9225,0.922196
60,0.1207,0.327897,0.9075,0.907486
80,0.0673,0.296734,0.9125,0.912456
100,0.048,0.334904,0.9275,0.927168
120,0.0274,0.374092,0.92,0.919838
140,0.0173,0.427769,0.9275,0.927168
160,0.0318,0.344557,0.9175,0.917064
180,0.0047,0.363004,0.9375,0.937359
200,0.0062,0.434106,0.9275,0.927445


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 1600
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 400
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4039,0.300697,0.91,0.909345
40,0.2004,0.265647,0.9125,0.911054
60,0.1027,0.30368,0.905,0.903836
80,0.0519,0.486875,0.885,0.884434
100,0.0232,0.562438,0.885,0.883953
120,0.0135,0.653945,0.8725,0.872269
140,0.0068,0.691417,0.895,0.894044
160,0.01,0.527782,0.9075,0.906518
180,0.0026,0.585768,0.915,0.914226
200,0.0069,0.657881,0.905,0.903367


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4039,0.300697,0.91,0.909345
40,0.2004,0.265647,0.9125,0.911054
60,0.1027,0.30368,0.905,0.903836
80,0.0519,0.486875,0.885,0.884434
100,0.0232,0.562438,0.885,0.883953
120,0.0135,0.653945,0.8725,0.872269
140,0.0068,0.691417,0.895,0.894044
160,0.01,0.527782,0.9075,0.906518
180,0.0026,0.585768,0.915,0.914226
200,0.0069,0.657881,0.905,0.903367


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4039,0.300697,0.91,0.909345
40,0.2004,0.265647,0.9125,0.911054
60,0.1027,0.30368,0.905,0.903836
80,0.0519,0.486875,0.885,0.884434
100,0.0232,0.562438,0.885,0.883953
120,0.0135,0.653945,0.8725,0.872269
140,0.0068,0.691417,0.895,0.894044
160,0.01,0.527782,0.9075,0.906518
180,0.0026,0.585768,0.915,0.914226
200,0.0069,0.657881,0.905,0.903367


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3839,0.237776,0.915,0.913758
40,0.1631,0.251016,0.92,0.919347
60,0.1258,0.218926,0.9375,0.937293
80,0.0717,0.477266,0.885,0.884997
100,0.0313,0.402906,0.92,0.919711
120,0.0013,0.509046,0.92,0.919606
140,0.0158,0.469213,0.9125,0.912377
160,0.0042,0.482765,0.915,0.914226
180,0.0049,0.486155,0.915,0.914828
200,0.011,0.563919,0.9275,0.927336


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3839,0.237776,0.915,0.913758
40,0.1631,0.251016,0.92,0.919347
60,0.1258,0.218926,0.9375,0.937293
80,0.0717,0.477266,0.885,0.884997
100,0.0313,0.402906,0.92,0.919711
120,0.0013,0.509046,0.92,0.919606
140,0.0158,0.469213,0.9125,0.912377
160,0.0042,0.482765,0.915,0.914226
180,0.0049,0.486155,0.915,0.914828
200,0.011,0.563919,0.9275,0.927336


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3839,0.237776,0.915,0.913758
40,0.1631,0.251016,0.92,0.919347
60,0.1258,0.218926,0.9375,0.937293
80,0.0717,0.477266,0.885,0.884997
100,0.0313,0.402906,0.92,0.919711
120,0.0013,0.509046,0.92,0.919606
140,0.0158,0.469213,0.9125,0.912377
160,0.0042,0.482765,0.915,0.914226
180,0.0049,0.486155,0.915,0.914828
200,0.011,0.563919,0.9275,0.927336


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4138,0.207872,0.9275,0.926941
40,0.1823,0.21237,0.93,0.929143
60,0.0957,0.165371,0.9525,0.952414
80,0.0751,0.209978,0.9375,0.937293
100,0.0383,0.242644,0.93,0.929825
120,0.0176,0.425738,0.9325,0.931979
140,0.0137,0.399561,0.935,0.934868
160,0.018,0.382697,0.9375,0.937387
180,0.0029,0.432516,0.94,0.939783
200,0.0038,0.468642,0.9325,0.932313


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4138,0.207872,0.9275,0.926941
40,0.1823,0.21237,0.93,0.929143
60,0.0957,0.165371,0.9525,0.952414
80,0.0751,0.209978,0.9375,0.937293
100,0.0383,0.242644,0.93,0.929825
120,0.0176,0.425738,0.9325,0.931979
140,0.0137,0.399561,0.935,0.934868
160,0.018,0.382697,0.9375,0.937387
180,0.0029,0.432516,0.94,0.939783
200,0.0038,0.468642,0.9325,0.932313


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4138,0.207872,0.9275,0.926941
40,0.1823,0.21237,0.93,0.929143
60,0.0957,0.165371,0.9525,0.952414
80,0.0751,0.209978,0.9375,0.937293
100,0.0383,0.242644,0.93,0.929825
120,0.0176,0.425738,0.9325,0.931979
140,0.0137,0.399561,0.935,0.934868
160,0.018,0.382697,0.9375,0.937387
180,0.0029,0.432516,0.94,0.939783
200,0.0038,0.468642,0.9325,0.932313


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 1600
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 400
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3833,0.345982,0.8875,0.88549
40,0.1934,0.304366,0.91,0.90918
60,0.2117,0.268805,0.9075,0.906419
80,0.0957,0.493631,0.87,0.869792
100,0.0784,0.475059,0.9075,0.905971
120,0.0727,0.379623,0.9025,0.901748
140,0.0325,0.488272,0.9025,0.902231
160,0.0146,0.729073,0.8975,0.896065
180,0.0045,0.808468,0.8825,0.881695
200,0.0096,0.78565,0.8975,0.896516


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3833,0.345982,0.8875,0.88549
40,0.1934,0.304366,0.91,0.90918
60,0.2117,0.268805,0.9075,0.906419
80,0.0957,0.493631,0.87,0.869792
100,0.0784,0.475059,0.9075,0.905971
120,0.0727,0.379623,0.9025,0.901748
140,0.0325,0.488272,0.9025,0.902231
160,0.0146,0.729073,0.8975,0.896065
180,0.0045,0.808468,0.8825,0.881695
200,0.0096,0.78565,0.8975,0.896516


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3833,0.345982,0.8875,0.88549
40,0.1934,0.304366,0.91,0.90918
60,0.2117,0.268805,0.9075,0.906419
80,0.0957,0.493631,0.87,0.869792
100,0.0784,0.475059,0.9075,0.905971
120,0.0727,0.379623,0.9025,0.901748
140,0.0325,0.488272,0.9025,0.902231
160,0.0146,0.729073,0.8975,0.896065
180,0.0045,0.808468,0.8825,0.881695
200,0.0096,0.78565,0.8975,0.896516


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3957,0.283554,0.9025,0.901911
40,0.1733,0.324287,0.9275,0.927336
60,0.1233,0.356819,0.9075,0.906941
80,0.1145,0.24648,0.9325,0.932037
100,0.0774,0.337088,0.915,0.914742
120,0.024,0.592234,0.895,0.894989
140,0.0246,0.572526,0.905,0.904848
160,0.0136,0.541905,0.9175,0.917272
180,0.0089,0.526254,0.9275,0.927062
200,0.0058,0.522684,0.92,0.919757


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3957,0.283554,0.9025,0.901911
40,0.1733,0.324287,0.9275,0.927336
60,0.1233,0.356819,0.9075,0.906941
80,0.1145,0.24648,0.9325,0.932037
100,0.0774,0.337088,0.915,0.914742
120,0.024,0.592234,0.895,0.894989
140,0.0246,0.572526,0.905,0.904848
160,0.0136,0.541905,0.9175,0.917272
180,0.0089,0.526254,0.9275,0.927062
200,0.0058,0.522684,0.92,0.919757


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.3957,0.283554,0.9025,0.901911
40,0.1733,0.324287,0.9275,0.927336
60,0.1233,0.356819,0.9075,0.906941
80,0.1145,0.24648,0.9325,0.932037
100,0.0774,0.337088,0.915,0.914742
120,0.024,0.592234,0.895,0.894989
140,0.0246,0.572526,0.905,0.904848
160,0.0136,0.541905,0.9175,0.917272
180,0.0089,0.526254,0.9275,0.927062
200,0.0058,0.522684,0.92,0.919757


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4001,0.237339,0.93,0.929491
40,0.1927,0.285153,0.9225,0.922145
60,0.1386,0.256948,0.9275,0.927398
80,0.0852,0.30862,0.9275,0.927216
100,0.045,0.363562,0.9175,0.917384
120,0.0524,0.40662,0.9225,0.92236
140,0.0163,0.520462,0.9125,0.912456
160,0.0165,0.508206,0.9225,0.9225
180,0.019,0.324986,0.95,0.949955
200,0.0191,0.327342,0.9375,0.937359


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4001,0.237339,0.93,0.929491
40,0.1927,0.285153,0.9225,0.922145
60,0.1386,0.256948,0.9275,0.927398
80,0.0852,0.30862,0.9275,0.927216
100,0.045,0.363562,0.9175,0.917384
120,0.0524,0.40662,0.9225,0.92236
140,0.0163,0.520462,0.9125,0.912456
160,0.0165,0.508206,0.9225,0.9225
180,0.019,0.324986,0.95,0.949955
200,0.0191,0.327342,0.9375,0.937359


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4001,0.237339,0.93,0.929491
40,0.1927,0.285153,0.9225,0.922145
60,0.1386,0.256948,0.9275,0.927398
80,0.0852,0.30862,0.9275,0.927216
100,0.045,0.363562,0.9175,0.917384
120,0.0524,0.40662,0.9225,0.92236
140,0.0163,0.520462,0.9125,0.912456
160,0.0165,0.508206,0.9225,0.9225
180,0.019,0.324986,0.95,0.949955
200,0.0191,0.327342,0.9375,0.937359


DatasetDict({
    train: Dataset({
        features: ['text', 'label'],
        num_rows: 1600
    })
    test: Dataset({
        features: ['text', 'label'],
        num_rows: 400
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4104,0.31493,0.8975,0.896958
40,0.2182,0.285901,0.9125,0.912038
60,0.1475,0.254794,0.925,0.92381
80,0.0877,0.295816,0.9225,0.922286
100,0.0969,0.334543,0.915,0.914923
120,0.0909,0.349554,0.915,0.914787
140,0.0463,0.404639,0.9125,0.912157
160,0.0166,0.433254,0.925,0.924081
180,0.0077,0.44449,0.9325,0.931783
200,0.0012,0.451769,0.935,0.934408


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4104,0.31493,0.8975,0.896958
40,0.2182,0.285901,0.9125,0.912038
60,0.1475,0.254794,0.925,0.92381
80,0.0877,0.295816,0.9225,0.922286
100,0.0969,0.334543,0.915,0.914923
120,0.0909,0.349554,0.915,0.914787
140,0.0463,0.404639,0.9125,0.912157
160,0.0166,0.433254,0.925,0.924081
180,0.0077,0.44449,0.9325,0.931783
200,0.0012,0.451769,0.935,0.934408


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4104,0.31493,0.8975,0.896958
40,0.2182,0.285901,0.9125,0.912038
60,0.1475,0.254794,0.925,0.92381
80,0.0877,0.295816,0.9225,0.922286
100,0.0969,0.334543,0.915,0.914923
120,0.0909,0.349554,0.915,0.914787
140,0.0463,0.404639,0.9125,0.912157
160,0.0166,0.433254,0.925,0.924081
180,0.0077,0.44449,0.9325,0.931783
200,0.0012,0.451769,0.935,0.934408


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.43,0.226258,0.92,0.919485
40,0.1822,0.231745,0.92,0.919485
60,0.1295,0.243052,0.925,0.924682
80,0.0726,0.34606,0.905,0.904848
100,0.0807,0.36752,0.915,0.914896
120,0.0392,0.464584,0.8925,0.892499
140,0.0088,0.412751,0.915,0.914519
160,0.0166,0.41476,0.9125,0.912258
180,0.0067,0.459843,0.9275,0.926804
200,0.0047,0.485842,0.9175,0.916863


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.43,0.226258,0.92,0.919485
40,0.1822,0.231745,0.92,0.919485
60,0.1295,0.243052,0.925,0.924682
80,0.0726,0.34606,0.905,0.904848
100,0.0807,0.36752,0.915,0.914896
120,0.0392,0.464584,0.8925,0.892499
140,0.0088,0.412751,0.915,0.914519
160,0.0166,0.41476,0.9125,0.912258
180,0.0067,0.459843,0.9275,0.926804
200,0.0047,0.485842,0.9175,0.916863


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.43,0.226258,0.92,0.919485
40,0.1822,0.231745,0.92,0.919485
60,0.1295,0.243052,0.925,0.924682
80,0.0726,0.34606,0.905,0.904848
100,0.0807,0.36752,0.915,0.914896
120,0.0392,0.464584,0.8925,0.892499
140,0.0088,0.412751,0.915,0.914519
160,0.0166,0.41476,0.9125,0.912258
180,0.0067,0.459843,0.9275,0.926804
200,0.0047,0.485842,0.9175,0.916863


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4342,0.265469,0.9125,0.911477
40,0.2085,0.176375,0.9425,0.942341
60,0.1257,0.270741,0.93,0.929984
80,0.11,0.180492,0.945,0.944767
100,0.0711,0.182479,0.9575,0.957383
120,0.0344,0.197984,0.9525,0.952314
140,0.0144,0.314507,0.945,0.944729
160,0.0088,0.310951,0.935,0.934959
180,0.017,0.395095,0.9325,0.932037
200,0.0009,0.323503,0.95,0.949939


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4342,0.265469,0.9125,0.911477
40,0.2085,0.176375,0.9425,0.942341
60,0.1257,0.270741,0.93,0.929984
80,0.11,0.180492,0.945,0.944767
100,0.0711,0.182479,0.9575,0.957383
120,0.0344,0.197984,0.9525,0.952314
140,0.0144,0.314507,0.945,0.944729
160,0.0088,0.310951,0.935,0.934959
180,0.017,0.395095,0.9325,0.932037
200,0.0009,0.323503,0.95,0.949939


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/1600 [00:00<?, ? examples/s]

Map:   0%|          | 0/400 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
20,0.4342,0.265469,0.9125,0.911477
40,0.2085,0.176375,0.9425,0.942341
60,0.1257,0.270741,0.93,0.929984
80,0.11,0.180492,0.945,0.944767
100,0.0711,0.182479,0.9575,0.957383
120,0.0344,0.197984,0.9525,0.952314
140,0.0144,0.314507,0.945,0.944729
160,0.0088,0.310951,0.935,0.934959
180,0.017,0.395095,0.9325,0.932037
200,0.0009,0.323503,0.95,0.949939


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.9375,0.937359
3,UBC-NLP/MARBERT,0.95,0.949955
6,UBC-NLP/MARBERTv2,0.9575,0.957383
9,aubmindlab/bert-base-arabertv02-twitter,0.94,0.939878
15,qarib/bert-base-qarib,0.9525,0.952414
