<a href="https://colab.research.google.com/github/marco-siino/text_preprocessing_impact/blob/main/20N_DS/ELECTRA_20N_TextPreProImpact_NBx.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

## Text preprocessing worth the time: A comparative survey on the impact of common techniques on NLP model performances.
- - -
ELECTRA ON 20N DS EXPERIMENTS NOTEBOOK
- - -
ELECTRA on 20N Dataset.
Code by M. Siino.

From the paper: "Text preprocessing worth the time: A comparative survey on the impact of common techniques on NLP model performances." by M.Siino et al.



## Importing modules.

In [None]:
!pip install simpletransformers
!pip install tensorboardx

import matplotlib.pyplot as plt
import os
import re
import shutil
import string
import tensorflow as tf
import numpy as np
import torch
import nltk
import pandas as pd

from tensorflow.keras import layers
from tensorflow.keras import losses
from tensorflow.keras import preprocessing
from keras.models import Model
from tensorflow.keras.layers.experimental.preprocessing import TextVectorization
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize
from nltk.stem import PorterStemmer
from textblob import TextBlob
nltk.download('stopwords')
nltk.download('punkt')
from io import open
from pathlib import Path
from simpletransformers.classification import ClassificationModel, ClassificationArgs
from sklearn.metrics import accuracy_score

Collecting simpletransformers
  Using cached simpletransformers-0.63.11-py3-none-any.whl (250 kB)
Collecting transformers>=4.6.0
  Using cached transformers-4.30.2-py3-none-any.whl (7.2 MB)
Collecting datasets
  Using cached datasets-2.13.1-py3-none-any.whl (486 kB)
Collecting wandb>=0.10.32
  Using cached wandb-0.15.5-py3-none-any.whl (2.1 MB)
Collecting scikit-learn
  Downloading scikit_learn-1.3.0-cp39-cp39-win_amd64.whl (9.3 MB)
     ---------------------------------------- 9.3/9.3 MB 10.3 MB/s eta 0:00:00
Collecting tokenizers
  Using cached tokenizers-0.13.3-cp39-cp39-win_amd64.whl (3.5 MB)
Collecting seqeval
  Using cached seqeval-1.2.2-py3-none-any.whl
Collecting pandas
  Downloading pandas-2.0.3-cp39-cp39-win_amd64.whl (10.8 MB)
     --------------------------------------- 10.8/10.8 MB 24.2 MB/s eta 0:00:00
Collecting streamlit
  Using cached streamlit-1.24.1-py2.py3-none-any.whl (8.9 MB)
Collecting scipy
  Downloading scipy-1.11.1-cp39-cp39-win_amd64.whl (44.1 MB)
     ------

[nltk_data] Downloading package stopwords to
[nltk_data]     C:\Users\Domenico\AppData\Roaming\nltk_data...
[nltk_data]   Package stopwords is already up-to-date!
[nltk_data] Downloading package punkt to
[nltk_data]     C:\Users\Domenico\AppData\Roaming\nltk_data...
[nltk_data]   Package punkt is already up-to-date!


## Download the dataset and extract it into the current working directory.

In [None]:
# Location of the 20 Newsgroups ("by date" split) archive in the paper's repository.
urlDataset = "https://github.com/marco-siino/text_preprocessing_impact/raw/main/20N_DS/20news-bydate.tar.gz"

# Fetch the archive and extract it. cache_dir='.' together with cache_subdir=''
# places the download in the current working directory.
dataset = tf.keras.utils.get_file("20news-bydate.tar.gz", urlDataset,
                                    extract=True, archive_format='tar',cache_dir='.',
                                    cache_subdir='')

# Folder names used below for the two splits.
# NOTE(review): presumably these are the top-level folders created by extracting the archive - confirm.
test_dir = '20news-bydate-test'
train_dir = '20news-bydate-train'

## Build the folder hierarchy required by the Keras directory-based dataset loader.

In [None]:
def walk_dir(targetdir,topdown=True):
    """Append a '.txt' extension to every file stored inside a sub-folder of `targetdir`.

    Files located directly in `targetdir` are left untouched; files in its
    sub-folders (at any depth) are renamed from `<name>` to `<name>.txt`.

    The function is safe to call repeatedly:
      * names that already end with '.txt' are skipped, so a second call does
        not produce '<name>.txt.txt';
      * if both `<name>` and `<name>.txt` exist (e.g. the archive was extracted
        again over an already converted tree), `<name>` replaces the older
        `<name>.txt` instead of raising FileExistsError.

    Args:
      targetdir: root folder whose sub-folders contain the files to rename.
      topdown: forwarded to `os.walk` as its `topdown` argument.
    """
    top = os.path.normpath(targetdir)
    for root, dirs, files in os.walk(targetdir, topdown):
        # Only files below a sub-folder are converted, never those directly in the root.
        if os.path.normpath(root) == top:
            continue
        for name in files:
            if name.endswith('.txt'):
                continue
            source = os.path.join(root, name)
            # os.replace overwrites an existing destination on every platform.
            os.replace(source, source + '.txt')

# Add the '.txt' suffix to the files of both splits before they are loaded
# with text_dataset_from_directory below.
walk_dir(test_dir)
walk_dir(train_dir)

FileExistsError: ignored

## Building the dataset.

In [None]:
# Load both splits, shuffle them once with a fixed seed, then keep a small subset.
# batch_size=1: every dataset element holds a single (document, label) pair;
# the conversion code further down reads index 0 of each batch.
batch_size=1

# shuffle=False here: shuffling is applied explicitly (and seeded) a few lines below.
train_ds = tf.keras.preprocessing.text_dataset_from_directory(
    train_dir,
    batch_size=batch_size,
    shuffle=False
    )

test_ds = tf.keras.preprocessing.text_dataset_from_directory(
    test_dir,
    batch_size=batch_size,
    shuffle=False
    )

# Buffer sizes equal the number of files reported for each split (11314 / 7532).
# reshuffle_each_iteration=False keeps the same order every time the dataset is iterated.
train_ds=train_ds.shuffle(11314,seed=1, reshuffle_each_iteration=False)
test_ds=test_ds.shuffle(7532,seed=1, reshuffle_each_iteration=False)

# Sizes of the complete splits, recorded before sub-sampling.
train_ds_size=len(train_ds)
test_ds_size=len(test_ds)

# Only the first 200 training and 50 test documents (after shuffling) are used from here on.
train_ds = train_ds.take(200)
test_ds = test_ds.take(50)


#train_ds = train_ds.map(lambda x, y: (x, tf.one_hot(y, depth=20)))
#test_ds = test_ds.map(lambda x, y: (x, tf.one_hot(y, depth=20)))

Found 11314 files belonging to 20 classes.
Found 7532 files belonging to 20 classes.


## Functions to preprocess the source text. (See our paper for a detailed discussion.)

In [None]:
# Do-Nothing preprocessing function.
def DON(input_data):
  """Baseline ("do nothing") preprocessing: only strips markup tags.

  The CDATA delimiters and the `<author lang="en">` / `</author>` tags are each
  replaced by a single space. The `<documents>` opening tag (with its trailing
  newline and up to two tabs) is removed, and the `</documents>` closing tag
  (same trailing whitespace) is replaced by a space. No other character of the
  text is modified.

  Args:
    input_data: string tensor (or value convertible to one) holding the text.

  Returns:
    The string tensor returned by the last `tf.strings.regex_replace` call.
  """
  # Raw strings keep the regex backslashes without relying on Python's
  # deprecated handling of unknown escape sequences such as '\!' or '\['.
  tag_open_CDATA_removed = tf.strings.regex_replace(input_data, r'<\!\[CDATA\[', ' ')
  tag_closed_CDATA_removed = tf.strings.regex_replace(tag_open_CDATA_removed, r'\]{1,}>', ' ')
  tag_author_lang_en_removed = tf.strings.regex_replace(tag_closed_CDATA_removed,'<author lang="en">', ' ')
  tag_closed_author_removed = tf.strings.regex_replace(tag_author_lang_en_removed,'</author>', ' ')
  tag_open_documents_removed = tf.strings.regex_replace(tag_closed_author_removed,'<documents>\n(\t){0,2}', '')
  output_data = tf.strings.regex_replace(tag_open_documents_removed,'</documents>\n(\t){0,2}', ' ')
  return output_data

# Lowercasing preprocessing function.
def LOW(input_data):
  """Strip the markup tags via `DON`, then lowercase the whole text."""
  cleaned = DON(input_data)
  lowered = tf.strings.lower(cleaned)
  return lowered

# Shared machinery for the word-level preprocessing functions (RSW and STM).
def _rewrite_words(output_data, rewrite_words):
  """Tokenize the text held by a string tensor, rewrite its words and re-wrap it.

  Two call shapes are supported, mirroring the two situations the notebook
  distinguishes:
    * the tensor can be indexed with [0] ("text-vectorization adaptation"
      case): the first element is processed and the result is returned with
      shape (1, 1);
    * indexing fails, as for a scalar tensor ("actual simulation" case): the
      tensor itself is processed and a scalar tensor is returned.

  Args:
    output_data: string tensor, as returned by `DON`.
    rewrite_words: callable receiving the TextBlob word list and returning
      the words to keep, in order.

  Returns:
    A string tensor with the rewritten words joined by single spaces, or
    `output_data` unchanged when its value cannot be read with `.numpy()`.
  """
  try:
    document = output_data[0]
    batched = True
  except Exception:
    # Indexing is not possible: treat the tensor itself as the document.
    document = output_data
    batched = False

  try:
    raw = document.numpy()
  except Exception:
    # No concrete value available (presumably a symbolic tensor): pass through.
    return output_data

  # A tensor of rank >= 1 yields an array; use its first entry as the document.
  if hasattr(raw, 'ravel'):
    raw = raw.ravel()[0] if raw.size else b''

  # Decode the bytes instead of slicing their repr(): the repr would inject
  # literal escape text ("\\n", "\\xe9", ...) into the document. ISO-8859-1 maps
  # every byte to one character, so decoding cannot fail and the encode below
  # restores the original byte values for the caller.
  text = raw.decode('ISO-8859-1')

  words = TextBlob(text).words
  rewritten = ' '.join(rewrite_words(words)).encode('ISO-8859-1', errors='replace')

  if batched:
    return tf.constant([[rewritten]])
  return tf.constant(rewritten)

# Removing Stop Words function.
def RSW(input_data):
  """Strip the markup tags via `DON`, then drop NLTK English stop words.

  The comparison is case-sensitive: a word is removed only if it appears
  verbatim in `stopwords.words('english')`.

  Args:
    input_data: string tensor (or value convertible to one) holding the text.

  Returns:
    String tensor with the remaining words joined by single spaces (see
    `_rewrite_words` for the returned shape and the pass-through case).
  """
  # Build the lookup once per call instead of once per word.
  english_stopwords = frozenset(stopwords.words('english'))
  return _rewrite_words(
      DON(input_data),
      lambda words: [word for word in words if word not in english_stopwords])

# Porter Stemmer preprocessing function.
def STM(input_data):
  """Strip the markup tags via `DON`, then stem every word with the Porter stemmer.

  Args:
    input_data: string tensor (or value convertible to one) holding the text.

  Returns:
    String tensor with the stemmed words joined by single spaces (see
    `_rewrite_words` for the returned shape and the pass-through case).
  """
  stemmer = PorterStemmer()
  return _rewrite_words(
      DON(input_data),
      lambda words: [stemmer.stem(word) for word in words])

## Define the combined preprocessing functions. (The base functions are: DON, LOW, RSW and STM).

In [None]:
## SECTION WITH PAIRS OF PREPRO FUNCTIONS. APPLICATION ORDER MATTERS (...IN FOLLOWING SECTIONS TOO).
#...5
def LOW_RSW(input_data):
  """Pipeline 5: lowercasing, then stop-word removal."""
  lowered = LOW(input_data)
  return RSW(lowered)

# 6
def LOW_STM(input_data):
  """Pipeline 6: lowercasing, then Porter stemming."""
  lowered = LOW(input_data)
  return STM(lowered)

# 7
def RSW_LOW(input_data):
  """Pipeline 7: stop-word removal, then lowercasing."""
  without_stopwords = RSW(input_data)
  return LOW(without_stopwords)

# 8
def RSW_STM(input_data):
  """Pipeline 8: stop-word removal, then Porter stemming."""
  without_stopwords = RSW(input_data)
  return STM(without_stopwords)

# 9
def STM_LOW(input_data):
  """Pipeline 9: Porter stemming, then lowercasing."""
  stemmed = STM(input_data)
  return LOW(stemmed)

# 10
def STM_RSW(input_data):
  """Pipeline 10: Porter stemming, then stop-word removal."""
  stemmed = STM(input_data)
  return RSW(stemmed)

# 11
def LOW_STM_RSW(input_data):
  """Pipeline 11: lowercasing, then Porter stemming, then stop-word removal."""
  lowered = LOW(input_data)
  stemmed = STM(lowered)
  return RSW(stemmed)

# 12
def LOW_RSW_STM(input_data):
  """Pipeline 12: lowercasing, then stop-word removal, then Porter stemming."""
  lowered = LOW(input_data)
  without_stopwords = RSW(lowered)
  return STM(without_stopwords)

# 13
def STM_LOW_RSW(input_data):
  """Pipeline 13: Porter stemming, then lowercasing, then stop-word removal."""
  stemmed = STM(input_data)
  lowered = LOW(stemmed)
  return RSW(lowered)

# 14
def STM_RSW_LOW(input_data):
  """Pipeline 14: Porter stemming, then stop-word removal, then lowercasing."""
  stemmed = STM(input_data)
  without_stopwords = RSW(stemmed)
  return LOW(without_stopwords)

# 15
def RSW_LOW_STM(input_data):
  """Pipeline 15: stop-word removal, then lowercasing, then Porter stemming."""
  without_stopwords = RSW(input_data)
  lowered = LOW(without_stopwords)
  return STM(lowered)

# 16
def RSW_STM_LOW(input_data):
  """Pipeline 16: stop-word removal, then Porter stemming, then lowercasing."""
  without_stopwords = RSW(input_data)
  stemmed = STM(without_stopwords)
  return LOW(stemmed)

## Define a dictionary mapping each preprocessing function name to its callable, and a dictionary to store the model results.

In [None]:
# Result store: one list of accuracy summaries per preprocessing pipeline.
model_results = {}

# The four elementary preprocessing functions.
prepro_functions_dict_base = {
    'DON': DON,
    'LOW': LOW,
    'RSW': RSW,
    'STM': STM,
}

# All pipelines under test: 3 single steps + 6 ordered pairs + 6 ordered
# triples = 15 combinations, plus the do-nothing baseline.
prepro_functions_dict_comb = {
    'DON': DON,                  # 1.  Do nothing
    'LOW': LOW,                  # 2.  Lowercasing
    'RSW': RSW,                  # 3.  Removing stop words
    'STM': STM,                  # 4.  Porter stemming
    'LOW_RSW': LOW_RSW,          # 5.  LOW->RSW
    'LOW_STM': LOW_STM,          # 6.  LOW->STM
    'RSW_LOW': RSW_LOW,          # 7.  RSW->LOW
    'RSW_STM': RSW_STM,          # 8.  RSW->STM
    'STM_LOW': STM_LOW,          # 9.  STM->LOW
    'STM_RSW': STM_RSW,          # 10. STM->RSW
    'LOW_STM_RSW': LOW_STM_RSW,  # 11. LOW->STM->RSW
    'LOW_RSW_STM': LOW_RSW_STM,  # 12. LOW->RSW->STM
    'STM_LOW_RSW': STM_LOW_RSW,  # 13. STM->LOW->RSW
    'STM_RSW_LOW': STM_RSW_LOW,  # 14. STM->RSW->LOW
    'RSW_LOW_STM': RSW_LOW_STM,  # 15. RSW->LOW->STM
    'RSW_STM_LOW': RSW_STM_LOW,  # 16. RSW->STM->LOW
}

# List the pipeline names and give each one an empty result list.
for key in prepro_functions_dict_comb.keys():
  print(key)
  model_results[key] = []

DON
LOW
RSW
STM
LOW_RSW
LOW_STM
RSW_LOW
RSW_STM
STM_LOW
STM_RSW
LOW_STM_RSW
LOW_RSW_STM
STM_LOW_RSW
STM_RSW_LOW
RSW_LOW_STM
RSW_STM_LOW


## Function to convert DSs to Pandas Dataframe

In [None]:
def preprocess_and_convert_ds(preprocessing_function):
  """Preprocess the train and test datasets and return them as DataFrames.

  Reads the module-level `train_ds` and `test_ds`. For every element, the
  first document of the batch is passed (as raw bytes) to
  `preprocessing_function`; the returned tensor is decoded as ISO-8859-1.

  Args:
    preprocessing_function: callable taking the document bytes and returning
      a tensor whose `.numpy()` value is a bytes object.

  Returns:
    Tuple `(train_df, test_df)` of DataFrames with columns 'text' and 'label'.
  """
  def _to_dataframe(dataset):
    # One row per dataset element: first document and first label of the batch.
    rows = []
    for documents, labels in ((item[0], item[1]) for item in dataset):
      label = labels.numpy()[0]
      text = preprocessing_function(documents[0].numpy()).numpy().decode('ISO-8859-1')
      rows.append({'text': text, 'label': label})
    return pd.DataFrame(rows)

  train_df = _to_dataframe(train_ds)
  test_df = _to_dataframe(test_ds)
  return train_df, test_df


## Print some RAW and preprocessed samples (No need to execute)

In [None]:
# Show the first two training documents before and after preprocessing.
# Uses the dataset and the DON function defined in this notebook, with the
# same ISO-8859-1 decoding as preprocess_and_convert_ds.
for authorDocument, label in train_ds.take(2):
  temp = DON(authorDocument[0].numpy()).numpy().decode('ISO-8859-1')
  print("Not-Preprocessed samples: \n",authorDocument)
  print("Preprocessed samples: \n",temp)

NameError: ignored

## Some parameters definition...

In [None]:
# Detect whether a CUDA device is available; the flag is passed to the model as use_cuda.
cuda_available = torch.cuda.is_available()

print('Cuda available? ',cuda_available)

# Number of train/evaluate rounds performed for each run.
num_epochs_per_run = 20
# Number of independent runs (each starting from a freshly loaded model) per preprocessing pipeline.
num_runs = 5

Cuda available?  False


## Training and evaluation of the model

In [None]:
# Reset the result store so that re-running this cell does not accumulate entries.
for key in prepro_functions_dict_comb:
  model_results[key]=[]

for key in prepro_functions_dict_comb:

  # Each train_model() call performs exactly one epoch; the epoch loop below
  # calls it repeatedly so that the test accuracy can be read after every epoch.
  model_args = ClassificationArgs(num_train_epochs=1,
                                      no_save=True,
                                      no_cache=True,
                                      overwrite_output_dir=True)

  # Best test accuracy reached in each run for this pipeline.
  runs_accuracy = []

  print("\n\n* * * * EVALUATION USING", key, "AS PREPROCESSING FUNCTION * * * *")

  # Preprocess train and test set and convert to DFs.
  train_df,test_df = preprocess_and_convert_ds(prepro_functions_dict_comb[key])

  for run in range(1,(num_runs+1)):
    epochs_accuracy=[]
    # Every run starts from a freshly loaded pre-trained checkpoint.
    model = ClassificationModel("electra",
                                  'google/electra-base-discriminator',
                                    args = model_args,
                                    num_labels=20,
                                    use_cuda=cuda_available)
    for epoch in range (0,num_epochs_per_run):
      print("\nEPOCH NUMBER: ", epoch)
      # train model
      print("\nNOW TRAIN THE MODEL.")
      model.train_model(train_df,show_running_loss=False)
      print("\nNOW EVALUATE THE TEST DF.")
      result, model_outputs, wrong_predictions = model.eval_model(test_df, acc=accuracy_score)
      # Results on test set.
      print(result)
      print("Accuracy on test set is:",result['acc'],"\n\n")
      epochs_accuracy.append(result['acc'])

    print(epochs_accuracy)
    # A run is summarised by its best per-epoch test accuracy.
    runs_accuracy.append(max(epochs_accuracy))

  runs_accuracy.sort()
  # Middle element of the sorted list: the median for an odd num_runs
  # (index 2 when num_runs is 5), the upper median for an even one.
  median_accuracy = runs_accuracy[len(runs_accuracy)//2]
  print("\n\n Over all runs maximum accuracies are:", runs_accuracy)
  print("The median is:",median_accuracy)

  # Largest distance between the median and either extreme of the runs.
  max_range_from_median = max(median_accuracy-runs_accuracy[0],
                              runs_accuracy[-1]-median_accuracy)
  final_result = str(median_accuracy)+" +/- "+ str(max_range_from_median)
  model_results[key].append(final_result)
  print("ELECTRA Accuracy Score on Test set -> ",model_results[key])


Some weights of the model checkpoint at google/electra-base-discriminator were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at google/electra-base-discriminator and are newly initialized: ['classifier.o



* * * * EVALUATION USING DON AS PREPROCESSING FUNCTION * * * *


Some weights of the model checkpoint at google/electra-base-discriminator were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at google/electra-base-discriminator and are newly initialized: ['classifier.o


EPOCH NUMBER:  0

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.002091812188062224, 'acc': 0.02, 'eval_loss': 3.026423624583653}
Accuracy on test set is: 0.02 



EPOCH NUMBER:  1

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0, 'acc': 0.02, 'eval_loss': 3.0179145336151123}
Accuracy on test set is: 0.02 



EPOCH NUMBER:  2

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0342454093832835, 'acc': 0.04, 'eval_loss': 3.034071786063058}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  3

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.016023575560283224, 'acc': 0.04, 'eval_loss': 3.0269524369921004}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  4

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.02245276918501188, 'acc': 0.04, 'eval_loss': 3.029223305838449}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  5

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.01903354881158958, 'acc': 0.04, 'eval_loss': 2.953260660171509}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  6

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.007446502881059473, 'acc': 0.04, 'eval_loss': 2.902585131781442}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  7

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.05078254054394018, 'acc': 0.08, 'eval_loss': 2.882653202329363}
Accuracy on test set is: 0.08 



EPOCH NUMBER:  8

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.08729661357522359, 'acc': 0.12, 'eval_loss': 2.7790125778743198}
Accuracy on test set is: 0.12 



EPOCH NUMBER:  9

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.10176307453853066, 'acc': 0.12, 'eval_loss': 2.7760301998683383}
Accuracy on test set is: 0.12 



EPOCH NUMBER:  10

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.088002175705257, 'acc': 0.12, 'eval_loss': 2.6891815662384033}
Accuracy on test set is: 0.12 



EPOCH NUMBER:  11

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.06472891067044882, 'acc': 0.1, 'eval_loss': 2.6641721044267928}
Accuracy on test set is: 0.1 



EPOCH NUMBER:  12

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.10609014430524502, 'acc': 0.14, 'eval_loss': 2.634011438914708}
Accuracy on test set is: 0.14 



EPOCH NUMBER:  13

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1726277623478402, 'acc': 0.2, 'eval_loss': 2.604148728506906}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  14

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.21201330702057478, 'acc': 0.24, 'eval_loss': 2.5348448753356934}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  15

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.15406050321095366, 'acc': 0.18, 'eval_loss': 2.6388135296957835}
Accuracy on test set is: 0.18 



EPOCH NUMBER:  16

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.21789188727567116, 'acc': 0.24, 'eval_loss': 2.5795037746429443}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  17

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.18909908729038566, 'acc': 0.22, 'eval_loss': 2.525509629930769}
Accuracy on test set is: 0.22 



EPOCH NUMBER:  18

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1680261620729794, 'acc': 0.2, 'eval_loss': 2.567049264907837}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  19

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.17135200537028336, 'acc': 0.2, 'eval_loss': 2.5760617596762523}
Accuracy on test set is: 0.2 


[0.02, 0.02, 0.04, 0.04, 0.04, 0.04, 0.04, 0.08, 0.12, 0.12, 0.12, 0.1, 0.14, 0.2, 0.24, 0.18, 0.24, 0.22, 0.2, 0.2]


Some weights of the model checkpoint at google/electra-base-discriminator were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at google/electra-base-discriminator and are newly initialized: ['classifier.o


EPOCH NUMBER:  0

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.040639867034387225, 'acc': 0.04, 'eval_loss': 2.99642961365836}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  1

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': -0.029782538480455364, 'acc': 0.06, 'eval_loss': 2.9844397476741245}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  2

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.004880895105478522, 'acc': 0.04, 'eval_loss': 2.996624708175659}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  3

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0, 'acc': 0.02, 'eval_loss': 3.0299673080444336}
Accuracy on test set is: 0.02 



EPOCH NUMBER:  4

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.036291585075163446, 'acc': 0.06, 'eval_loss': 3.007265363420759}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  5

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.04317475205618936, 'acc': 0.08, 'eval_loss': 2.9756927149636403}
Accuracy on test set is: 0.08 



EPOCH NUMBER:  6

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.02396679400621821, 'acc': 0.06, 'eval_loss': 2.9542334420340404}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  7

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.08494830907177937, 'acc': 0.12, 'eval_loss': 2.9187424864087785}
Accuracy on test set is: 0.12 



EPOCH NUMBER:  8

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.11164178939652818, 'acc': 0.14, 'eval_loss': 2.8995517662593295}
Accuracy on test set is: 0.14 



EPOCH NUMBER:  9

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.15941065217382802, 'acc': 0.18, 'eval_loss': 2.844754593712943}
Accuracy on test set is: 0.18 



EPOCH NUMBER:  10

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1662889659936733, 'acc': 0.2, 'eval_loss': 2.781874316079276}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  11

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.12317245567642854, 'acc': 0.16, 'eval_loss': 2.7509275504520962}
Accuracy on test set is: 0.16 



EPOCH NUMBER:  12

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1886775582573559, 'acc': 0.22, 'eval_loss': 2.6565021787370955}
Accuracy on test set is: 0.22 



EPOCH NUMBER:  13

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.16971461586635517, 'acc': 0.2, 'eval_loss': 2.6086659090859547}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  14

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.23170948466731156, 'acc': 0.26, 'eval_loss': 2.5339135783059255}
Accuracy on test set is: 0.26 



EPOCH NUMBER:  15

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.16772530925854112, 'acc': 0.2, 'eval_loss': 2.5023810863494873}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  16

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.20781895863464608, 'acc': 0.24, 'eval_loss': 2.4203729118619646}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  17

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.23713838798925926, 'acc': 0.26, 'eval_loss': 2.4067465237208774}
Accuracy on test set is: 0.26 



EPOCH NUMBER:  18

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.27714915483155006, 'acc': 0.3, 'eval_loss': 2.3212738377707347}
Accuracy on test set is: 0.3 



EPOCH NUMBER:  19

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.23554353516567778, 'acc': 0.26, 'eval_loss': 2.3599341256277904}
Accuracy on test set is: 0.26 


[0.04, 0.06, 0.04, 0.02, 0.06, 0.08, 0.06, 0.12, 0.14, 0.18, 0.2, 0.16, 0.22, 0.2, 0.26, 0.2, 0.24, 0.26, 0.3, 0.26]


Some weights of the model checkpoint at google/electra-base-discriminator were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at google/electra-base-discriminator and are newly initialized: ['classifier.o


EPOCH NUMBER:  0

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0, 'acc': 0.06, 'eval_loss': 3.005564178739275}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  1

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0, 'acc': 0.06, 'eval_loss': 3.0144905703408376}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  2

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.06315505607444591, 'acc': 0.1, 'eval_loss': 3.003762994493757}
Accuracy on test set is: 0.1 



EPOCH NUMBER:  3

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': -0.0062494619636165845, 'acc': 0.02, 'eval_loss': 3.0312297344207764}
Accuracy on test set is: 0.02 



EPOCH NUMBER:  4

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': -0.0059778512482351305, 'acc': 0.02, 'eval_loss': 3.0300874369485036}
Accuracy on test set is: 0.02 



EPOCH NUMBER:  5

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.06507081322479333, 'acc': 0.06, 'eval_loss': 3.018787281853812}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  6

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.06236274376388373, 'acc': 0.06, 'eval_loss': 2.9618758133479526}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  7

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1068714609007346, 'acc': 0.1, 'eval_loss': 2.932307686124529}
Accuracy on test set is: 0.1 



EPOCH NUMBER:  8

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.12450542401460657, 'acc': 0.14, 'eval_loss': 2.845488820757185}
Accuracy on test set is: 0.14 



EPOCH NUMBER:  9

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.10294994629970185, 'acc': 0.12, 'eval_loss': 2.8460469245910645}
Accuracy on test set is: 0.12 



EPOCH NUMBER:  10

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.09909106645462508, 'acc': 0.12, 'eval_loss': 2.777816499982561}
Accuracy on test set is: 0.12 



EPOCH NUMBER:  11

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.13914715146466014, 'acc': 0.16, 'eval_loss': 2.7231038979121616}
Accuracy on test set is: 0.16 



EPOCH NUMBER:  12

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.17999858111303438, 'acc': 0.2, 'eval_loss': 2.677007402692522}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  13

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.17796271641381842, 'acc': 0.2, 'eval_loss': 2.6367058413369313}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  14

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.19704126087622179, 'acc': 0.22, 'eval_loss': 2.6297316210610524}
Accuracy on test set is: 0.22 



EPOCH NUMBER:  15

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.22708009938970547, 'acc': 0.26, 'eval_loss': 2.508166824068342}
Accuracy on test set is: 0.26 



EPOCH NUMBER:  16

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.25289879287547, 'acc': 0.28, 'eval_loss': 2.496908732822963}
Accuracy on test set is: 0.28 



EPOCH NUMBER:  17

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.2519196169400486, 'acc': 0.28, 'eval_loss': 2.5029098646981374}
Accuracy on test set is: 0.28 



EPOCH NUMBER:  18

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.21658832827827396, 'acc': 0.24, 'eval_loss': 2.539804662976946}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  19

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.20370900023896266, 'acc': 0.24, 'eval_loss': 2.574921114104135}
Accuracy on test set is: 0.24 


[0.06, 0.06, 0.1, 0.02, 0.02, 0.06, 0.06, 0.1, 0.14, 0.12, 0.12, 0.16, 0.2, 0.2, 0.22, 0.26, 0.28, 0.28, 0.24, 0.24]


Some weights of the model checkpoint at google/electra-base-discriminator were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at google/electra-base-discriminator and are newly initialized: ['classifier.o


EPOCH NUMBER:  0

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': -0.014436278486635649, 'acc': 0.0, 'eval_loss': 3.0055218764713834}
Accuracy on test set is: 0.0 



EPOCH NUMBER:  1

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': -0.07173421497882156, 'acc': 0.04, 'eval_loss': 3.033768824168614}
Accuracy on test set is: 0.04 



EPOCH NUMBER:  2

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.002091812188062224, 'acc': 0.06, 'eval_loss': 2.999885218484061}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  3

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.003699409670642617, 'acc': 0.06, 'eval_loss': 3.019707679748535}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  4

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': -0.044030295698435924, 'acc': 0.0, 'eval_loss': 2.970705713544573}
Accuracy on test set is: 0.0 



EPOCH NUMBER:  5

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.08342854051563875, 'acc': 0.1, 'eval_loss': 2.968245949063982}
Accuracy on test set is: 0.1 



EPOCH NUMBER:  6

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1125337486285867, 'acc': 0.14, 'eval_loss': 2.9514431612832204}
Accuracy on test set is: 0.14 



EPOCH NUMBER:  7

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.1088428134681489, 'acc': 0.14, 'eval_loss': 2.873826163155692}
Accuracy on test set is: 0.14 



EPOCH NUMBER:  8

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.13342219466610925, 'acc': 0.16, 'eval_loss': 2.7925331933157787}
Accuracy on test set is: 0.16 



EPOCH NUMBER:  9

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.15236489749555912, 'acc': 0.18, 'eval_loss': 2.782574244907924}
Accuracy on test set is: 0.18 



EPOCH NUMBER:  10

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.2010789001146469, 'acc': 0.24, 'eval_loss': 2.698875938143049}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  11

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.16605713217609783, 'acc': 0.2, 'eval_loss': 2.6561290877205983}
Accuracy on test set is: 0.2 



EPOCH NUMBER:  12

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.2049883513306542, 'acc': 0.24, 'eval_loss': 2.614553792136056}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  13

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.20879940702103, 'acc': 0.24, 'eval_loss': 2.5725809846605574}
Accuracy on test set is: 0.24 



EPOCH NUMBER:  14

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.19248767485107104, 'acc': 0.22, 'eval_loss': 2.5247467245374406}
Accuracy on test set is: 0.22 



EPOCH NUMBER:  15

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.27322968530926217, 'acc': 0.3, 'eval_loss': 2.4096095051084245}
Accuracy on test set is: 0.3 



EPOCH NUMBER:  16

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.30468372748977773, 'acc': 0.34, 'eval_loss': 2.3426869426454817}
Accuracy on test set is: 0.34 



EPOCH NUMBER:  17

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.2411651367359038, 'acc': 0.28, 'eval_loss': 2.420368637357439}
Accuracy on test set is: 0.28 



EPOCH NUMBER:  18

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.2833656252481542, 'acc': 0.32, 'eval_loss': 2.2859082221984863}
Accuracy on test set is: 0.32 



EPOCH NUMBER:  19

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.30818636302246494, 'acc': 0.34, 'eval_loss': 2.2323402166366577}
Accuracy on test set is: 0.34 


[0.0, 0.04, 0.06, 0.06, 0.0, 0.1, 0.14, 0.14, 0.16, 0.18, 0.24, 0.2, 0.24, 0.24, 0.22, 0.3, 0.34, 0.28, 0.32, 0.34]


Some weights of the model checkpoint at google/electra-base-discriminator were not used when initializing ElectraForSequenceClassification: ['discriminator_predictions.dense_prediction.bias', 'discriminator_predictions.dense.weight', 'discriminator_predictions.dense.bias', 'discriminator_predictions.dense_prediction.weight']
- This IS expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing ElectraForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of ElectraForSequenceClassification were not initialized from the model checkpoint at google/electra-base-discriminator and are newly initialized: ['classifier.o


EPOCH NUMBER:  0

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.011778571185788636, 'acc': 0.06, 'eval_loss': 3.020096472331456}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  1

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0, 'acc': 0.02, 'eval_loss': 2.985994338989258}
Accuracy on test set is: 0.02 



EPOCH NUMBER:  2

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.021019298392969468, 'acc': 0.06, 'eval_loss': 3.0286547797066823}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  3

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.0, 'acc': 0.06, 'eval_loss': 3.0078300748552596}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  4

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.030167066876356594, 'acc': 0.08, 'eval_loss': 2.978862626211984}
Accuracy on test set is: 0.08 



EPOCH NUMBER:  5

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]


NOW EVALUATE THE TEST DF.




  0%|          | 0/50 [00:00<?, ?it/s]

Running Evaluation:   0%|          | 0/7 [00:00<?, ?it/s]

{'mcc': 0.02407728751204372, 'acc': 0.06, 'eval_loss': 2.928691864013672}
Accuracy on test set is: 0.06 



EPOCH NUMBER:  6

NOW TRAIN THE MODEL.




  0%|          | 0/200 [00:00<?, ?it/s]

Epoch:   0%|          | 0/1 [00:00<?, ?it/s]

Running Epoch 0 of 1:   0%|          | 0/25 [00:00<?, ?it/s]

## Now show compact results in a table.

In [None]:
# Compact results table: one header line, then one row per entry of
# `prepro_functions_dict_comb`, each separated by blank lines.
# NOTE(review): `model_results[...]` is built in an earlier cell; its first
# element is what gets shown under "Test Accuracy" — confirm what it holds.

# Header text followed by two newlines (the "\n" argument plus print's own).
print(" PREPRO FUNCTION    |  Test Accuracy   |", "\n", sep='')

for prepro_func in prepro_functions_dict_comb:
  # Only the first stored value for this preprocessing entry is displayed.
  result = model_results[prepro_func][0]
  # The name goes in a 27-character field and the value in a 12-character
  # field; the extra "\n" argument joined with sep='\n' leaves the same two
  # blank lines after every row as a separate print("\n") would.
  print(f'{prepro_func:27}{result:12}', "\n", sep='\n')