In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 

import numpy as np
import tensorflow as tf
import pandas as pd
import pyarabic.araby as araby
import warnings
warnings.filterwarnings('ignore')
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.initializers import TruncatedNormal
from tensorflow.keras.losses import CategoricalCrossentropy
from tensorflow.keras.metrics import CategoricalAccuracy
import torch
from sklearn.metrics import accuracy_score, f1_score
from transformers import Trainer, TrainingArguments
from transformers import AutoTokenizer, AutoModelForSequenceClassification
from datasets import load_dataset, Dataset, concatenate_datasets
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 1000)


fname = 'Open_1'
log_file = fname + '.txt'

with open(log_file, 'w') as f:
    f.write('Model,Accuracy,F1\n')


df1 = pd.read_csv('datasets/OpenAccessArDialect/Sentiment_Anaysis.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3
df2 = pd.read_csv('datasets/OpenAccessArDialect/dialect.csv', encoding='utf-8', engine='python') #, quotechar="'"  , quoting=3

df2 = df2[df2['dialect'] == 'Morocco']
      
display(df1.columns)
display(df1[:4])

display(df2.columns)
display(df2[:4])
display(len(df2))



df = df1[df1['Twits'].isin(df2['Twits'])]

display(df[:5])
display(len(df))

c = df['label'].value_counts()
display(c)

classes = set(df['label'].values)
display(classes)

df['label'] = df['label'].astype('category')
df['label'] = df['label'].cat.codes

df = df[['Twits', 'label']]
classes_num = len(classes)
display(classes_num)
display(len(df))



max_sequence_length = 128



models = [ 
        'aubmindlab/bert-base-arabertv02-twitter',
        'CAMeL-Lab/bert-base-arabic-camelbert-da',
        'qarib/bert-base-qarib', 
        'UBC-NLP/MARBERT',
        'UBC-NLP/MARBERTv2',
    'SI2M-Lab/DarijaBERT-mix',
    'SI2M-Lab/DarijaBERT-arabizi'
]


seeds = [0, 1, 42]

for model_name in models:
    for seed in seeds:
        ds = Dataset.from_pandas(df)
        ds = ds.train_test_split(test_size=0.2, seed = seed)
        if seed==0:
            display(ds)
            
        for i in range(3):
            print(f'{model_name}, try:{i}')
                  
            tokenizer = AutoTokenizer.from_pretrained(model_name)
            model = AutoModelForSequenceClassification.from_pretrained(model_name,
                                                                  num_labels=classes_num).to('cuda')                                                 
            dataset_train = ds['train']
            dataset_validation = ds['test']                                                    
            
          
    
            def preprocess_function(examples):
                return tokenizer(examples['Twits'], truncation=True, padding="max_length",
                                max_length=max_sequence_length)
            
            
            dataset_train = dataset_train.map(preprocess_function, batched=True)
            dataset_validation = dataset_validation.map(preprocess_function, batched=True)
            
           
            
            def compute_metrics(eval_pred):
                logits, labels = eval_pred
                predictions = np.argmax(logits, axis=-1)    
                acc = accuracy_score(labels, predictions)        
                f1 = f1_score(labels, predictions, average='macro')   
                with open(log_file, 'a') as f:
                    f.write(f'{model_name},{acc},{f1}\n')
                return {'accuracy': acc, 'f1_score': f1}
    
    
            
            
            epochs = 12
            save_steps = 10000 #save checkpoint every 10000 steps
            batch_size = 64
            
            training_args = TrainingArguments(
                output_dir = 'bert/',
                overwrite_output_dir=True,
                num_train_epochs = epochs,
                per_device_train_batch_size = batch_size,
                per_device_eval_batch_size = batch_size,
                save_steps = save_steps,
                save_total_limit = 1, #only save the last 5 checkpoints
                fp16=True,
                learning_rate = 5e-5,  # 5e-5 is the default
                logging_steps = 50, #50_000
                evaluation_strategy = 'steps',
                # evaluate_during_training = True,
                eval_steps = 50
                
            )
            
            trainer = Trainer(
                model = model,
                args = training_args,
                # data_collator=data_collator,
                train_dataset=dataset_train,
                eval_dataset=dataset_validation,
                compute_metrics = compute_metrics
            )
            
            
            trainer.train()


results = pd.read_csv(log_file)

best_results = results.groupby('Model', as_index=False)['F1'].max()

best_results = pd.merge(best_results, results, on=['Model', 'F1'])
best_results = best_results[['Model', 'Accuracy', 'F1']]
best_results = best_results.drop_duplicates()
best_results.to_csv(f'{fname}.csv')
display(best_results)



2024-09-18 10:10:12.368881: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2024-09-18 10:10:12.394067: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


Index(['Unnamed: 0', 'Twits', 'label'], dtype='object')

Unnamed: 0.1,Unnamed: 0,Twits,label
0,0,what happens,neu
1,1,😞😞,neg
2,2,ان شاء الله,neu
3,3,بالتوفيق ان شاء الله,pos


Index(['Twits', 'dialect'], dtype='object')

Unnamed: 0,Twits,dialect
13393,slawiya msikina tb9a f darha 😐😕😕,Morocco
13394,ناس د الرباط أش واقع عندكم تما ... ياكما شي شبه عائلية 😐,Morocco
13395,لي دوا مشاا 😂😂,Morocco
13396,: وزراء تقلقوا,Morocco


9965

Unnamed: 0.1,Unnamed: 0,Twits,label
8,8,ههههههههه,pos
9,9,"هههه ضروري بإذن الله , لفقر را عيب ؤ عار ؤ حشومة",neg
10,10,مع فاق كيم جون من المرض وهو اكتب لينا مشروع قانون شكرا كيم جون ، عاشت كوريا,pos
11,11,الوادافاكية: زوجة اليوسفي تعزي جلالة الملك في وفاة زوجها,neg
12,12,: ها علاش مكنقراوش للقصص للاطفال قبل النوم😂😂😂,neu


8520

label
neu    6923
neg    1200
pos     397
Name: count, dtype: int64

{'neg', 'neu', 'pos'}

3

8520

DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3789,0.339218,0.873239,0.68326
100,0.3015,0.313107,0.877934,0.718619
150,0.2131,0.357511,0.891432,0.711395
200,0.2275,0.351177,0.879108,0.684438
250,0.1697,0.3546,0.879695,0.714416
300,0.0941,0.418645,0.893192,0.727131
350,0.0795,0.460789,0.880869,0.710618
400,0.0393,0.53649,0.875587,0.72037
450,0.0457,0.518401,0.887324,0.744105
500,0.0217,0.619335,0.867371,0.724274


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3914,0.334781,0.883803,0.686574
100,0.2968,0.314345,0.876761,0.706728
150,0.2085,0.35869,0.888498,0.704108
200,0.2223,0.356097,0.893192,0.709268
250,0.1587,0.369164,0.875587,0.711357
300,0.0891,0.439631,0.88615,0.721005
350,0.0728,0.482812,0.878521,0.711711
400,0.0435,0.531076,0.884977,0.721482
450,0.0336,0.582711,0.890845,0.729332
500,0.0174,0.623069,0.887324,0.730322


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3914,0.334781,0.883803,0.686574
100,0.2968,0.314345,0.876761,0.706728
150,0.2085,0.35869,0.888498,0.704108
200,0.2223,0.356097,0.893192,0.709268
250,0.1587,0.369164,0.875587,0.711357
300,0.0891,0.439631,0.88615,0.721005
350,0.0728,0.482812,0.878521,0.711711
400,0.0435,0.531076,0.884977,0.721482
450,0.0336,0.582711,0.890845,0.729332
500,0.0174,0.623069,0.887324,0.730322


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4016,0.323904,0.872066,0.67493
100,0.2872,0.313004,0.883803,0.68119
150,0.2434,0.333387,0.880282,0.680636
200,0.2204,0.32914,0.88615,0.697156
250,0.1477,0.387898,0.888498,0.6786
300,0.134,0.387046,0.887911,0.707644
350,0.0767,0.443253,0.88439,0.701535
400,0.0516,0.443742,0.88439,0.708933
450,0.034,0.495777,0.892606,0.731687
500,0.0353,0.510374,0.885563,0.72541


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4016,0.323904,0.872066,0.67493
100,0.2872,0.313004,0.883803,0.68119
150,0.2434,0.333387,0.880282,0.680636
200,0.2204,0.32914,0.88615,0.697156
250,0.1477,0.387898,0.888498,0.6786
300,0.134,0.387046,0.887911,0.707644
350,0.0767,0.443253,0.88439,0.701535
400,0.0516,0.443742,0.88439,0.708933
450,0.034,0.495777,0.892606,0.731687
500,0.0353,0.510374,0.885563,0.72541


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4016,0.323904,0.872066,0.67493
100,0.2872,0.313004,0.883803,0.68119
150,0.2434,0.333387,0.880282,0.680636
200,0.2204,0.32914,0.88615,0.697156
250,0.1477,0.387898,0.888498,0.6786
300,0.134,0.387046,0.887911,0.707644
350,0.0767,0.443253,0.88439,0.701535
400,0.0516,0.443742,0.88439,0.708933
450,0.034,0.495777,0.892606,0.731687
500,0.0353,0.510374,0.885563,0.72541


aubmindlab/bert-base-arabertv02-twitter, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4141,0.314625,0.879108,0.693768
100,0.2924,0.288695,0.896714,0.722354
150,0.2278,0.293057,0.89554,0.723519
200,0.2222,0.292757,0.903756,0.744286
250,0.1353,0.353117,0.900235,0.725896
300,0.1115,0.381814,0.8973,0.717646
350,0.0882,0.413401,0.892019,0.73926
400,0.05,0.42012,0.893192,0.72852
450,0.0355,0.504032,0.8973,0.723195
500,0.0261,0.556636,0.881455,0.714037


aubmindlab/bert-base-arabertv02-twitter, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4141,0.314625,0.879108,0.693768
100,0.2924,0.288695,0.896714,0.722354
150,0.2278,0.293057,0.89554,0.723519
200,0.2222,0.292757,0.903756,0.744286
250,0.1353,0.353117,0.900235,0.725896
300,0.1115,0.381814,0.8973,0.717646
350,0.0882,0.413401,0.892019,0.73926
400,0.05,0.42012,0.893192,0.72852
450,0.0355,0.504032,0.8973,0.723195
500,0.0261,0.556636,0.881455,0.714037


aubmindlab/bert-base-arabertv02-twitter, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at aubmindlab/bert-base-arabertv02-twitter and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4141,0.314625,0.879108,0.693768
100,0.2924,0.288695,0.896714,0.722354
150,0.2278,0.293057,0.89554,0.723519
200,0.2222,0.292757,0.903756,0.744286
250,0.1353,0.353117,0.900235,0.725896
300,0.1115,0.381814,0.8973,0.717646
350,0.0882,0.413401,0.892019,0.73926
400,0.05,0.42012,0.893192,0.72852
450,0.0355,0.504032,0.8973,0.723195
500,0.0261,0.556636,0.881455,0.714037


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3987,0.342939,0.872653,0.640209
100,0.3239,0.33121,0.870305,0.66143
150,0.2208,0.351776,0.883216,0.725992
200,0.255,0.341469,0.876174,0.618767
250,0.1538,0.3948,0.875587,0.713178
300,0.121,0.389915,0.879695,0.705977
350,0.0934,0.496307,0.886737,0.715586
400,0.0522,0.526302,0.889085,0.722215
450,0.042,0.597528,0.88615,0.692499
500,0.0358,0.564113,0.887324,0.729515


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3987,0.342939,0.872653,0.640209
100,0.3239,0.33121,0.870305,0.66143
150,0.2208,0.351776,0.883216,0.725992
200,0.255,0.341469,0.876174,0.618767
250,0.1538,0.3948,0.875587,0.713178
300,0.121,0.389915,0.879695,0.705977
350,0.0934,0.496307,0.886737,0.715586
400,0.0522,0.526302,0.889085,0.722215
450,0.042,0.597528,0.88615,0.692499
500,0.0358,0.564113,0.887324,0.729515


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3987,0.342939,0.872653,0.640209
100,0.3239,0.33121,0.870305,0.66143
150,0.2208,0.351776,0.883216,0.725992
200,0.255,0.341469,0.876174,0.618767
250,0.1538,0.3948,0.875587,0.713178
300,0.121,0.389915,0.879695,0.705977
350,0.0934,0.496307,0.886737,0.715586
400,0.0522,0.526302,0.889085,0.722215
450,0.042,0.597528,0.88615,0.692499
500,0.0358,0.564113,0.887324,0.729515


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4141,0.323997,0.873826,0.672636
100,0.2918,0.31762,0.88439,0.67616
150,0.2488,0.324174,0.88439,0.674413
200,0.2165,0.385363,0.863263,0.641085
250,0.1606,0.372284,0.886737,0.706062
300,0.1266,0.364767,0.890258,0.727278
350,0.1052,0.493382,0.889085,0.72759
400,0.07,0.407614,0.885563,0.706682
450,0.0559,0.476963,0.896714,0.73928
500,0.0463,0.577601,0.882629,0.678808


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4141,0.323997,0.873826,0.672636
100,0.2918,0.31762,0.88439,0.67616
150,0.2488,0.324174,0.88439,0.674413
200,0.2165,0.385363,0.863263,0.641085
250,0.1606,0.372284,0.886737,0.706062
300,0.1266,0.364767,0.890258,0.727278
350,0.1052,0.493382,0.889085,0.72759
400,0.07,0.407614,0.885563,0.706682
450,0.0559,0.476963,0.896714,0.73928
500,0.0463,0.577601,0.882629,0.678808


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4141,0.323997,0.873826,0.672636
100,0.2918,0.31762,0.88439,0.67616
150,0.2488,0.324174,0.88439,0.674413
200,0.2165,0.385363,0.863263,0.641085
250,0.1606,0.372284,0.886737,0.706062
300,0.1266,0.364767,0.890258,0.727278
350,0.1052,0.493382,0.889085,0.72759
400,0.07,0.407614,0.885563,0.706682
450,0.0559,0.476963,0.896714,0.73928
500,0.0463,0.577601,0.882629,0.678808


CAMeL-Lab/bert-base-arabic-camelbert-da, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4278,0.331018,0.882042,0.655535
100,0.2969,0.305003,0.889671,0.723374
150,0.2462,0.299948,0.892019,0.682186
200,0.2278,0.311186,0.892019,0.724106
250,0.1394,0.450745,0.890845,0.733504
300,0.1254,0.392701,0.889085,0.696543
350,0.1036,0.535241,0.875587,0.698606
400,0.1181,0.569499,0.866784,0.677643
450,0.069,0.510709,0.889085,0.731247
500,0.0465,0.563104,0.882629,0.706954


CAMeL-Lab/bert-base-arabic-camelbert-da, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4278,0.331018,0.882042,0.655535
100,0.2969,0.305003,0.889671,0.723374
150,0.2462,0.299948,0.892019,0.682186
200,0.2278,0.311186,0.892019,0.724106
250,0.1394,0.450745,0.890845,0.733504
300,0.1254,0.392701,0.889085,0.696543
350,0.1036,0.535241,0.875587,0.698606
400,0.1181,0.569499,0.866784,0.677643
450,0.069,0.510709,0.889085,0.731247
500,0.0465,0.563104,0.882629,0.706954


CAMeL-Lab/bert-base-arabic-camelbert-da, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at CAMeL-Lab/bert-base-arabic-camelbert-da and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4278,0.331018,0.882042,0.655535
100,0.2969,0.305003,0.889671,0.723374
150,0.2462,0.299948,0.892019,0.682186
200,0.2278,0.311186,0.892019,0.724106
250,0.1394,0.450745,0.890845,0.733504
300,0.1254,0.392701,0.889085,0.696543
350,0.1036,0.535241,0.875587,0.698606
400,0.1181,0.569499,0.866784,0.677643
450,0.069,0.510709,0.889085,0.731247
500,0.0465,0.563104,0.882629,0.706954


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3882,0.346688,0.864437,0.69451
100,0.3005,0.31391,0.882042,0.696561
150,0.1975,0.367022,0.882042,0.702358
200,0.1995,0.352181,0.88615,0.701395
250,0.1253,0.424822,0.880869,0.706458
300,0.0667,0.502764,0.887324,0.719321
350,0.0599,0.546309,0.877347,0.687698
400,0.0484,0.576663,0.876174,0.694661
450,0.0454,0.610227,0.876174,0.696761
500,0.0169,0.702847,0.878521,0.724313


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3882,0.346688,0.864437,0.69451
100,0.3005,0.31391,0.882042,0.696561
150,0.1975,0.367022,0.882042,0.702358
200,0.1995,0.352181,0.88615,0.701395
250,0.1253,0.424822,0.880869,0.706458
300,0.0667,0.502764,0.887324,0.719321
350,0.0599,0.546309,0.877347,0.687698
400,0.0484,0.576663,0.876174,0.694661
450,0.0454,0.610227,0.876174,0.696761
500,0.0169,0.702847,0.878521,0.724313


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3882,0.346688,0.864437,0.69451
100,0.3005,0.31391,0.882042,0.696561
150,0.1975,0.367022,0.882042,0.702358
200,0.1995,0.352181,0.88615,0.701395
250,0.1253,0.424822,0.880869,0.706458
300,0.0667,0.502764,0.887324,0.719321
350,0.0599,0.546309,0.877347,0.687698
400,0.0484,0.576663,0.876174,0.694661
450,0.0454,0.610227,0.876174,0.696761
500,0.0169,0.702847,0.878521,0.724313


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3926,0.323215,0.865023,0.703021
100,0.2832,0.317834,0.891432,0.684132
150,0.2163,0.320892,0.893192,0.726021
200,0.1852,0.40296,0.867958,0.663645
250,0.1209,0.44002,0.889671,0.699906
300,0.1016,0.408046,0.891432,0.715877
350,0.0561,0.488633,0.899648,0.728174
400,0.0401,0.510033,0.880869,0.711238
450,0.0426,0.563259,0.893192,0.71911
500,0.0247,0.567892,0.887324,0.723488


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3926,0.323215,0.865023,0.703021
100,0.2832,0.317834,0.891432,0.684132
150,0.2163,0.320892,0.893192,0.726021
200,0.1852,0.40296,0.867958,0.663645
250,0.1209,0.44002,0.889671,0.699906
300,0.1016,0.408046,0.891432,0.715877
350,0.0561,0.488633,0.899648,0.728174
400,0.0401,0.510033,0.880869,0.711238
450,0.0426,0.563259,0.893192,0.71911
500,0.0247,0.567892,0.887324,0.723488


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3926,0.323215,0.865023,0.703021
100,0.2832,0.317834,0.891432,0.684132
150,0.2163,0.320892,0.893192,0.726021
200,0.1852,0.40296,0.867958,0.663645
250,0.1209,0.44002,0.889671,0.699906
300,0.1016,0.408046,0.891432,0.715877
350,0.0561,0.488633,0.899648,0.728174
400,0.0401,0.510033,0.880869,0.711238
450,0.0426,0.563259,0.893192,0.71911
500,0.0247,0.567892,0.887324,0.723488


qarib/bert-base-qarib, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4105,0.292505,0.892606,0.728567
100,0.2981,0.292369,0.887324,0.735546
150,0.2164,0.288675,0.897887,0.751394
200,0.2077,0.300638,0.907277,0.749244
250,0.1103,0.402511,0.911972,0.767154
300,0.1024,0.377449,0.904343,0.732341
350,0.078,0.490071,0.896127,0.714848
400,0.0418,0.465074,0.897887,0.749318
450,0.042,0.546672,0.881455,0.716202
500,0.0335,0.590939,0.894953,0.723805


qarib/bert-base-qarib, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4105,0.292505,0.892606,0.728567
100,0.2981,0.292369,0.887324,0.735546
150,0.2164,0.288675,0.897887,0.751394
200,0.2077,0.300638,0.907277,0.749244
250,0.1103,0.402511,0.911972,0.767154
300,0.1024,0.377449,0.904343,0.732341
350,0.078,0.490071,0.896127,0.714848
400,0.0418,0.465074,0.897887,0.749318
450,0.042,0.546672,0.881455,0.716202
500,0.0335,0.590939,0.894953,0.723805


qarib/bert-base-qarib, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at qarib/bert-base-qarib and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4105,0.292505,0.892606,0.728567
100,0.2981,0.292369,0.887324,0.735546
150,0.2164,0.288675,0.897887,0.751394
200,0.2077,0.300638,0.907277,0.749244
250,0.1103,0.402511,0.911972,0.767154
300,0.1024,0.377449,0.904343,0.732341
350,0.078,0.490071,0.896127,0.714848
400,0.0418,0.465074,0.897887,0.749318
450,0.042,0.546672,0.881455,0.716202
500,0.0335,0.590939,0.894953,0.723805


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4182,0.385937,0.843897,0.676074
100,0.3365,0.336083,0.870305,0.692658
150,0.223,0.364893,0.88615,0.74311
200,0.2324,0.358024,0.885563,0.675981
250,0.1333,0.458701,0.882629,0.721203
300,0.092,0.471768,0.890258,0.741695
350,0.0595,0.597967,0.873826,0.673654
400,0.049,0.580562,0.886737,0.72595
450,0.0404,0.598557,0.88615,0.749618
500,0.0327,0.666876,0.883803,0.731779


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4182,0.385937,0.843897,0.676074
100,0.3365,0.336083,0.870305,0.692658
150,0.223,0.364893,0.88615,0.74311
200,0.2324,0.358024,0.885563,0.675981
250,0.1333,0.458701,0.882629,0.721203
300,0.092,0.471768,0.890258,0.741695
350,0.0595,0.597967,0.873826,0.673654
400,0.049,0.580562,0.886737,0.72595
450,0.0404,0.598557,0.88615,0.749618
500,0.0327,0.666876,0.883803,0.731779


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4182,0.385937,0.843897,0.676074
100,0.3365,0.336083,0.870305,0.692658
150,0.223,0.364893,0.88615,0.74311
200,0.2324,0.358024,0.885563,0.675981
250,0.1333,0.458701,0.882629,0.721203
300,0.092,0.471768,0.890258,0.741695
350,0.0595,0.597967,0.873826,0.673654
400,0.049,0.580562,0.886737,0.72595
450,0.0404,0.598557,0.88615,0.749618
500,0.0327,0.666876,0.883803,0.731779


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4246,0.326788,0.867371,0.707006
100,0.2996,0.314024,0.881455,0.669339
150,0.2679,0.33279,0.876761,0.68279
200,0.2067,0.332052,0.885563,0.701552
250,0.152,0.495805,0.869718,0.667408
300,0.1344,0.391609,0.876761,0.713434
350,0.0866,0.531933,0.879108,0.712245
400,0.0597,0.761587,0.860915,0.631199
450,0.0515,0.635859,0.881455,0.717747
500,0.0525,0.619462,0.872066,0.704569


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4246,0.326788,0.867371,0.707006
100,0.2996,0.314024,0.881455,0.669339
150,0.2679,0.33279,0.876761,0.68279
200,0.2067,0.332052,0.885563,0.701552
250,0.152,0.495805,0.869718,0.667408
300,0.1344,0.391609,0.876761,0.713434
350,0.0866,0.531933,0.879108,0.712245
400,0.0597,0.761587,0.860915,0.631199
450,0.0515,0.635859,0.881455,0.717747
500,0.0525,0.619462,0.872066,0.704569


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4246,0.326788,0.867371,0.707006
100,0.2996,0.314024,0.881455,0.669339
150,0.2679,0.33279,0.876761,0.68279
200,0.2067,0.332052,0.885563,0.701552
250,0.152,0.495805,0.869718,0.667408
300,0.1344,0.391609,0.876761,0.713434
350,0.0866,0.531933,0.879108,0.712245
400,0.0597,0.761587,0.860915,0.631199
450,0.0515,0.635859,0.881455,0.717747
500,0.0525,0.619462,0.872066,0.704569


UBC-NLP/MARBERT, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4334,0.330445,0.884977,0.704558
100,0.3014,0.331448,0.870892,0.721165
150,0.2274,0.32225,0.889671,0.710225
200,0.2331,0.301683,0.899061,0.754691
250,0.1321,0.481579,0.880869,0.712245
300,0.1019,0.396936,0.896714,0.744487
350,0.0747,0.535557,0.889671,0.714615
400,0.0541,0.727405,0.871479,0.68898
450,0.0434,0.614233,0.883803,0.744957
500,0.0288,0.625029,0.887324,0.71701


UBC-NLP/MARBERT, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4334,0.330445,0.884977,0.704558
100,0.3014,0.331448,0.870892,0.721165
150,0.2274,0.32225,0.889671,0.710225
200,0.2331,0.301683,0.899061,0.754691
250,0.1321,0.481579,0.880869,0.712245
300,0.1019,0.396936,0.896714,0.744487
350,0.0747,0.535557,0.889671,0.714615
400,0.0541,0.727405,0.871479,0.68898
450,0.0434,0.614233,0.883803,0.744957
500,0.0288,0.625029,0.887324,0.71701


UBC-NLP/MARBERT, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERT and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4334,0.330445,0.884977,0.704558
100,0.3014,0.331448,0.870892,0.721165
150,0.2274,0.32225,0.889671,0.710225
200,0.2331,0.301683,0.899061,0.754691
250,0.1321,0.481579,0.880869,0.712245
300,0.1019,0.396936,0.896714,0.744487
350,0.0747,0.535557,0.889671,0.714615
400,0.0541,0.727405,0.871479,0.68898
450,0.0434,0.614233,0.883803,0.744957
500,0.0288,0.625029,0.887324,0.71701


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.49,0.413661,0.869718,0.535394
100,0.3769,0.334868,0.876761,0.680282
150,0.2768,0.357501,0.878521,0.679086
200,0.293,0.342061,0.888498,0.653253
250,0.2202,0.484667,0.836268,0.68218
300,0.1706,0.385676,0.872066,0.715907
350,0.1313,0.473165,0.86561,0.702938
400,0.1045,0.489506,0.876174,0.715471
450,0.0857,0.606536,0.857981,0.700209
500,0.0652,0.55475,0.866784,0.714071


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.49,0.413661,0.869718,0.535394
100,0.3769,0.334868,0.876761,0.680282
150,0.2768,0.357501,0.878521,0.679086
200,0.293,0.342061,0.888498,0.653253
250,0.2202,0.484667,0.836268,0.68218
300,0.1706,0.385676,0.872066,0.715907
350,0.1313,0.473165,0.86561,0.702938
400,0.1045,0.489506,0.876174,0.715471
450,0.0857,0.606536,0.857981,0.700209
500,0.0652,0.55475,0.866784,0.714071


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.49,0.413661,0.869718,0.535394
100,0.3769,0.334868,0.876761,0.680282
150,0.2768,0.357501,0.878521,0.679086
200,0.293,0.342061,0.888498,0.653253
250,0.2202,0.484667,0.836268,0.68218
300,0.1706,0.385676,0.872066,0.715907
350,0.1313,0.473165,0.86561,0.702938
400,0.1045,0.489506,0.876174,0.715471
450,0.0857,0.606536,0.857981,0.700209
500,0.0652,0.55475,0.866784,0.714071


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4602,0.365337,0.856808,0.537172
100,0.3047,0.319271,0.882629,0.696219
150,0.2658,0.322362,0.889085,0.718554
200,0.2041,0.336036,0.879108,0.714494
250,0.1498,0.411267,0.880282,0.695828
300,0.1255,0.403416,0.889085,0.732738
350,0.091,0.523116,0.888498,0.738958
400,0.0742,0.543299,0.886737,0.712926
450,0.058,0.522441,0.882629,0.7275
500,0.0627,0.647229,0.881455,0.697129


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4602,0.365337,0.856808,0.537172
100,0.3047,0.319271,0.882629,0.696219
150,0.2658,0.322362,0.889085,0.718554
200,0.2041,0.336036,0.879108,0.714494
250,0.1498,0.411267,0.880282,0.695828
300,0.1255,0.403416,0.889085,0.732738
350,0.091,0.523116,0.888498,0.738958
400,0.0742,0.543299,0.886737,0.712926
450,0.058,0.522441,0.882629,0.7275
500,0.0627,0.647229,0.881455,0.697129


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4602,0.365337,0.856808,0.537172
100,0.3047,0.319271,0.882629,0.696219
150,0.2658,0.322362,0.889085,0.718554
200,0.2041,0.336036,0.879108,0.714494
250,0.1498,0.411267,0.880282,0.695828
300,0.1255,0.403416,0.889085,0.732738
350,0.091,0.523116,0.888498,0.738958
400,0.0742,0.543299,0.886737,0.712926
450,0.058,0.522441,0.882629,0.7275
500,0.0627,0.647229,0.881455,0.697129


UBC-NLP/MARBERTv2, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4629,0.345058,0.875,0.59796
100,0.3074,0.317026,0.888498,0.738483
150,0.2408,0.31689,0.882042,0.730322
200,0.2361,0.284062,0.900822,0.761729
250,0.1325,0.377538,0.900235,0.738877
300,0.1331,0.366016,0.903756,0.745798
350,0.1097,0.483929,0.88439,0.746526
400,0.0699,0.478821,0.876761,0.745694
450,0.0544,0.492437,0.886737,0.736352
500,0.0373,0.588746,0.881455,0.725518


UBC-NLP/MARBERTv2, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4629,0.345058,0.875,0.59796
100,0.3074,0.317026,0.888498,0.738483
150,0.2408,0.31689,0.882042,0.730322
200,0.2361,0.284062,0.900822,0.761729
250,0.1325,0.377538,0.900235,0.738877
300,0.1331,0.366016,0.903756,0.745798
350,0.1097,0.483929,0.88439,0.746526
400,0.0699,0.478821,0.876761,0.745694
450,0.0544,0.492437,0.886737,0.736352
500,0.0373,0.588746,0.881455,0.725518


UBC-NLP/MARBERTv2, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at UBC-NLP/MARBERTv2 and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4629,0.345058,0.875,0.59796
100,0.3074,0.317026,0.888498,0.738483
150,0.2408,0.31689,0.882042,0.730322
200,0.2361,0.284062,0.900822,0.761729
250,0.1325,0.377538,0.900235,0.738877
300,0.1331,0.366016,0.903756,0.745798
350,0.1097,0.483929,0.88439,0.746526
400,0.0699,0.478821,0.876761,0.745694
450,0.0544,0.492437,0.886737,0.736352
500,0.0373,0.588746,0.881455,0.725518


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.449,0.339839,0.875,0.643454
100,0.3274,0.339528,0.875587,0.668234
150,0.2768,0.372934,0.864437,0.601579
200,0.3246,0.359089,0.870305,0.573683
250,0.269,0.385934,0.86385,0.578385
300,0.2535,0.403381,0.870892,0.609743
350,0.2064,0.453557,0.862676,0.574584
400,0.1666,0.447394,0.85446,0.599853
450,0.1568,0.525373,0.859742,0.585869
500,0.1485,0.522486,0.846244,0.586019


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.449,0.339839,0.875,0.643454
100,0.3274,0.339528,0.875587,0.668234
150,0.2768,0.372934,0.864437,0.601579
200,0.3246,0.359089,0.870305,0.573683
250,0.269,0.385934,0.86385,0.578385
300,0.2535,0.403381,0.870892,0.609743
350,0.2064,0.453557,0.862676,0.574584
400,0.1666,0.447394,0.85446,0.599853
450,0.1568,0.525373,0.859742,0.585869
500,0.1485,0.522486,0.846244,0.586019


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.449,0.339839,0.875,0.643454
100,0.3274,0.339528,0.875587,0.668234
150,0.2768,0.372934,0.864437,0.601579
200,0.3246,0.359089,0.870305,0.573683
250,0.269,0.385934,0.86385,0.578385
300,0.2535,0.403381,0.870892,0.609743
350,0.2064,0.453557,0.862676,0.574584
400,0.1666,0.447394,0.85446,0.599853
450,0.1568,0.525373,0.859742,0.585869
500,0.1485,0.522486,0.846244,0.586019


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4749,0.398622,0.856221,0.550811
100,0.3463,0.364412,0.864437,0.564727
150,0.3268,0.346419,0.869131,0.612574
200,0.3169,0.355716,0.860329,0.634167
250,0.2461,0.388142,0.870305,0.639744
300,0.2408,0.329786,0.889085,0.720223
350,0.1872,0.375172,0.875,0.699298
400,0.1451,0.387904,0.879108,0.689961
450,0.1231,0.401983,0.890258,0.720801
500,0.0934,0.49184,0.874413,0.697849


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4749,0.398622,0.856221,0.550811
100,0.3463,0.364412,0.864437,0.564727
150,0.3268,0.346419,0.869131,0.612574
200,0.3169,0.355716,0.860329,0.634167
250,0.2461,0.388142,0.870305,0.639744
300,0.2408,0.329786,0.889085,0.720223
350,0.1872,0.375172,0.875,0.699298
400,0.1451,0.387904,0.879108,0.689961
450,0.1231,0.401983,0.890258,0.720801
500,0.0934,0.49184,0.874413,0.697849


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4749,0.398622,0.856221,0.550811
100,0.3463,0.364412,0.864437,0.564727
150,0.3268,0.346419,0.869131,0.612574
200,0.3169,0.355716,0.860329,0.634167
250,0.2461,0.388142,0.870305,0.639744
300,0.2408,0.329786,0.889085,0.720223
350,0.1872,0.375172,0.875,0.699298
400,0.1451,0.387904,0.879108,0.689961
450,0.1231,0.401983,0.890258,0.720801
500,0.0934,0.49184,0.874413,0.697849


SI2M-Lab/DarijaBERT-mix, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4633,0.335598,0.867958,0.578077
100,0.3283,0.327987,0.88615,0.67755
150,0.2856,0.314709,0.878521,0.710915
200,0.2967,0.305373,0.892019,0.735726
250,0.2511,0.317915,0.893779,0.735701
300,0.2328,0.475508,0.862089,0.59111
350,0.2173,0.334884,0.896714,0.755235
400,0.1698,0.338034,0.889085,0.715994
450,0.1299,0.373708,0.896127,0.744619
500,0.0908,0.491801,0.885563,0.720981


SI2M-Lab/DarijaBERT-mix, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4633,0.335598,0.867958,0.578077
100,0.3283,0.327987,0.88615,0.67755
150,0.2856,0.314709,0.878521,0.710915
200,0.2967,0.305373,0.892019,0.735726
250,0.2511,0.317915,0.893779,0.735701
300,0.2328,0.475508,0.862089,0.59111
350,0.2173,0.334884,0.896714,0.755235
400,0.1698,0.338034,0.889085,0.715994
450,0.1299,0.373708,0.896127,0.744619
500,0.0908,0.491801,0.885563,0.720981


SI2M-Lab/DarijaBERT-mix, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-mix and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4633,0.335598,0.867958,0.578077
100,0.3283,0.327987,0.88615,0.67755
150,0.2856,0.314709,0.878521,0.710915
200,0.2967,0.305373,0.892019,0.735726
250,0.2511,0.317915,0.893779,0.735701
300,0.2328,0.475508,0.862089,0.59111
350,0.2173,0.334884,0.896714,0.755235
400,0.1698,0.338034,0.889085,0.715994
450,0.1299,0.373708,0.896127,0.744619
500,0.0908,0.491801,0.885563,0.720981


DatasetDict({
    train: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 6816
    })
    test: Dataset({
        features: ['Twits', 'label', '__index_level_0__'],
        num_rows: 1704
    })
})

SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3971,0.322722,0.877934,0.654172
100,0.3218,0.333988,0.870305,0.696372
150,0.2107,0.372218,0.880869,0.72425
200,0.2267,0.347937,0.890258,0.717006
250,0.1389,0.42718,0.891432,0.718742
300,0.116,0.402117,0.879108,0.711232
350,0.0724,0.514306,0.886737,0.708341
400,0.0446,0.59175,0.878521,0.710693
450,0.0512,0.607801,0.882629,0.733303
500,0.0302,0.649584,0.873826,0.718679


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3971,0.322722,0.877934,0.654172
100,0.3218,0.333988,0.870305,0.696372
150,0.2107,0.372218,0.880869,0.72425
200,0.2267,0.347937,0.890258,0.717006
250,0.1389,0.42718,0.891432,0.718742
300,0.116,0.402117,0.879108,0.711232
350,0.0724,0.514306,0.886737,0.708341
400,0.0446,0.59175,0.878521,0.710693
450,0.0512,0.607801,0.882629,0.733303
500,0.0302,0.649584,0.873826,0.718679


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.3971,0.322722,0.877934,0.654172
100,0.3218,0.333988,0.870305,0.696372
150,0.2107,0.372218,0.880869,0.72425
200,0.2267,0.347937,0.890258,0.717006
250,0.1389,0.42718,0.891432,0.718742
300,0.116,0.402117,0.879108,0.711232
350,0.0724,0.514306,0.886737,0.708341
400,0.0446,0.59175,0.878521,0.710693
450,0.0512,0.607801,0.882629,0.733303
500,0.0302,0.649584,0.873826,0.718679


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.413,0.328082,0.866784,0.705141
100,0.3035,0.305381,0.88615,0.655909
150,0.2482,0.338294,0.873826,0.679073
200,0.2072,0.350865,0.869131,0.692027
250,0.1605,0.413721,0.892019,0.691957
300,0.1236,0.401068,0.885563,0.705774
350,0.0874,0.48808,0.88615,0.723611
400,0.05,0.696727,0.869131,0.681045
450,0.041,0.539332,0.889671,0.712464
500,0.0327,0.723454,0.879695,0.697246


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.413,0.328082,0.866784,0.705141
100,0.3035,0.305381,0.88615,0.655909
150,0.2482,0.338294,0.873826,0.679073
200,0.2072,0.350865,0.869131,0.692027
250,0.1605,0.413721,0.892019,0.691957
300,0.1236,0.401068,0.885563,0.705774
350,0.0874,0.48808,0.88615,0.723611
400,0.05,0.696727,0.869131,0.681045
450,0.041,0.539332,0.889671,0.712464
500,0.0327,0.723454,0.879695,0.697246


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.413,0.328082,0.866784,0.705141
100,0.3035,0.305381,0.88615,0.655909
150,0.2482,0.338294,0.873826,0.679073
200,0.2072,0.350865,0.869131,0.692027
250,0.1605,0.413721,0.892019,0.691957
300,0.1236,0.401068,0.885563,0.705774
350,0.0874,0.48808,0.88615,0.723611
400,0.05,0.696727,0.869131,0.681045
450,0.041,0.539332,0.889671,0.712464
500,0.0327,0.723454,0.879695,0.697246


SI2M-Lab/DarijaBERT-arabizi, try:0


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4294,0.332067,0.873826,0.698081
100,0.3071,0.306542,0.890845,0.709264
150,0.2364,0.294765,0.892606,0.725153
200,0.2304,0.284264,0.907864,0.765434
250,0.1394,0.398566,0.903756,0.741832
300,0.1247,0.378283,0.8973,0.695348
350,0.0933,0.433174,0.892606,0.744404
400,0.0564,0.478135,0.8973,0.729498
450,0.034,0.500728,0.902582,0.770524
500,0.031,0.562793,0.896127,0.743033


SI2M-Lab/DarijaBERT-arabizi, try:1


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4294,0.332067,0.873826,0.698081
100,0.3071,0.306542,0.890845,0.709264
150,0.2364,0.294765,0.892606,0.725153
200,0.2304,0.284264,0.907864,0.765434
250,0.1394,0.398566,0.903756,0.741832
300,0.1247,0.378283,0.8973,0.695348
350,0.0933,0.433174,0.892606,0.744404
400,0.0564,0.478135,0.8973,0.729498
450,0.034,0.500728,0.902582,0.770524
500,0.031,0.562793,0.896127,0.743033


SI2M-Lab/DarijaBERT-arabizi, try:2


Some weights of BertForSequenceClassification were not initialized from the model checkpoint at SI2M-Lab/DarijaBERT-arabizi and are newly initialized: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Map:   0%|          | 0/6816 [00:00<?, ? examples/s]

Map:   0%|          | 0/1704 [00:00<?, ? examples/s]

Step,Training Loss,Validation Loss,Accuracy,F1 Score
50,0.4294,0.332067,0.873826,0.698081
100,0.3071,0.306542,0.890845,0.709264
150,0.2364,0.294765,0.892606,0.725153
200,0.2304,0.284264,0.907864,0.765434
250,0.1394,0.398566,0.903756,0.741832
300,0.1247,0.378283,0.8973,0.695348
350,0.0933,0.433174,0.892606,0.744404
400,0.0564,0.478135,0.8973,0.729498
450,0.034,0.500728,0.902582,0.770524
500,0.031,0.562793,0.896127,0.743033


Unnamed: 0,Model,Accuracy,F1
0,CAMeL-Lab/bert-base-arabic-camelbert-da,0.888498,0.745876
3,SI2M-Lab/DarijaBERT-arabizi,0.902582,0.770524
6,SI2M-Lab/DarijaBERT-mix,0.900235,0.756567
9,UBC-NLP/MARBERT,0.899061,0.754691
12,UBC-NLP/MARBERTv2,0.900235,0.767904
15,aubmindlab/bert-base-arabertv02-twitter,0.893192,0.745771
18,qarib/bert-base-qarib,0.911972,0.767154
