In [1]:
import numpy as np
import matplotlib.pyplot as plt
import torch
import transformers
import os

In [2]:
# MODEL / DATA SETTINGS

# Language code; selects the variety label dictionary ('en' or 'es') and is passed to BasePAN17.
_LANGUAGE_ = 'es'
# Checkpoint name used for both the tokenizer and the sequence classifier.
_PRETRAINED_LM_ = 'pysentimiento/robertuito-base-cased'
# Forwarded to BasePAN17(preprocess_text = ...).
_PREPROCESS_TEXT_ = True
# Forwarded to BasePAN17(tweet_batch_size = ...).
_TWEET_BATCH_SIZE_ = 5
# NOTE(review): not referenced by the cells visible here, which fine-tune with the plain Trainer.
_ADAPTER_CONFIG_ = transformers.ParallelConfig(
    mh_adapter = True,
    reduction_factor = 32,
)
# Forwarded to BasePAN17(max_seq_len = ...).
_MAX_SEQ_LEN_ = 128
# Root directory for Trainer checkpoints; the task name is appended as a sub-directory.
_OUTPUT_DIR_ = 'adapter_checkPoints'
# NOTE(review): not referenced by the cells visible here (logging_strategy is 'epoch').
_LOGGING_STEPS_ = 2
# Author budgets (authors per label) iterated by the few-shot training loop.
_NUM_AUTHORS_ = [8]
# Number of cross-validation folds.
_K_FOLD_CV_ = 5

# TRAIN

# GPU count; also written into the trainer arguments by the training loop.
_NO_GPUS_ = 2
# Per-device batch size, chosen so that all GPUs together process 64 examples per step.
_BATCH_SIZE_ = int(64 / _NO_GPUS_)
# Maximum number of training epochs per task.
_EPOCHS_ = {
    'gender':  20,
    'variety': 20,
}
_LEARNING_RATE_ = 1e-5

## Base

In [3]:
# LABEL DICTIONARIES ----------------------------------------------------------------------
# Each dictionary maps a class name to its integer label; ids follow the listing order.

gender_dict = {name: idx for idx, name in enumerate(['female', 'male'])}

varietyEN_dict = {
    country: idx
    for idx, country in enumerate([
        'australia',
        'canada',
        'great britain',
        'ireland',
        'new zealand',
        'united states',
    ])
}

varietyES_dict = {
    country: idx
    for idx, country in enumerate([
        'argentina',
        'chile',
        'colombia',
        'mexico',
        'peru',
        'spain',
        'venezuela',
    ])
}

In [4]:
# SET LANGUAGE DICTIONARY
# Pick the variety label dictionary that matches _LANGUAGE_.
# An unsupported language fails here with a clear message instead of leaving
# `variety_dict` undefined (or stale from an earlier kernel run).

if _LANGUAGE_ == 'en':
    variety_dict = varietyEN_dict

elif _LANGUAGE_ == 'es':
    variety_dict = varietyES_dict

else:
    raise ValueError(f"Unsupported _LANGUAGE_ {_LANGUAGE_!r}; expected 'en' or 'es'.")

In [5]:
# SET LANGUAGE TOKENIZER
# Load the tokenizer that ships with the pretrained checkpoint named by _PRETRAINED_LM_.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained(_PRETRAINED_LM_)
# Token -> id mapping of the tokenizer; not referenced by the other cells visible here.
vocab = tokenizer.get_vocab()

## Dataset

In [6]:
from DatasetPAN17 import BasePAN17, DatasetPAN17, DatasetCrossVal

In [7]:
# Build the train and test base datasets. Both splits share every setting
# except `split`, so the common keyword arguments are declared once.
_base_kwargs = dict(
    Dir              = '../data',
    language         = _LANGUAGE_,
    tokenizer        = tokenizer,
    gender_dict      = gender_dict,
    variety_dict     = variety_dict,
    tweet_batch_size = _TWEET_BATCH_SIZE_,
    max_seq_len      = _MAX_SEQ_LEN_,
    preprocess_text  = _PREPROCESS_TEXT_,
)

baseTrain = BasePAN17(split = 'train', **_base_kwargs)

baseTest = BasePAN17(split = 'test', **_base_kwargs)


Reading data...
    Done
Preprocessing text...
    Done
Tokenizing...
    Done
Merging data...
    Done

Total Instances: 84000


Reading data...
    Done
Preprocessing text...
    Done
Tokenizing...
    Done
Merging data...
    Done

Total Instances: 56000



In [8]:
# Wrap the test base dataset with the 'gender' label selected.
Test = DatasetPAN17(Base_Dataset = baseTest, label = 'gender')

## Training

In [9]:
# Task names iterated by the training loop; each name is also used as a key into
# _EPOCHS_ and num_labels_dict and as the checkpoint sub-directory.
tasks = ['gender']

In [10]:
from transformers import AutoModelForSequenceClassification, AutoAdapterModel
from transformers import TrainingArguments, Trainer, AdapterTrainer, EarlyStoppingCallback
from TestingPAN17 import compute_accuracy, compute_test_metrics

# FEW-SHOT FINE-TUNING WITH K-FOLD CROSS-VALIDATION
#
# For every author budget in _NUM_AUTHORS_ and every task in `tasks`:
#   * a fresh classifier is fine-tuned once per fold (_K_FOLD_CV_ folds),
#   * the best checkpoint of that fold (highest 'eval_acc') is evaluated on the test split,
#   * mean and standard deviation of accuracy / f1-score over the folds are stored
#     in FewShot_Results[num].
#
# Datasets and metrics are selected with `task_name`, so a task other than
# 'gender' is trained and scored against its own labels.

num_v           = len(baseTest.variety_dict)
num_labels_dict = {"gender": 2, "variety": num_v,}

# NOTE(review): results are keyed by author budget only; with more than one entry
# in `tasks`, a later task overwrites the earlier task's entry for the same budget.
FewShot_Results = {}

for num in _NUM_AUTHORS_:
    # SHOW CURRENT PORTION
    print(f"Working with {num} authors per label ... ")

    dataset_dict = {}
    models = {}

    for task_name in tasks:

        # Test split labelled for the current task (built once per task, reused by every fold).
        task_test = DatasetPAN17(Base_Dataset = baseTest, label = task_name)

        acc = []
        f1s = []

        for val_idx in range(_K_FOLD_CV_):
            print(f"Train,Val split number {val_idx + 1} of {_K_FOLD_CV_}")

            # INITIALIZE MODEL-----------------------------------------
            # A new model per fold so that no weights leak between folds.
            models[task_name] = AutoModelForSequenceClassification.from_pretrained(
                _PRETRAINED_LM_,
                num_labels = num_labels_dict[task_name]
            )

            # GENERATES DATASET WITH CURRENT PORTION ----------------------

            data_train, data_val = baseTrain.cross_val(k = _K_FOLD_CV_, val_idx = val_idx, num_authors = num)
            Train = DatasetCrossVal(Base_Data = data_train, label = task_name)
            Val   = DatasetCrossVal(Base_Data = data_val  , label = task_name)

            # FINE-TUNE MODEL------------------------------------------
            # All model weights are trained with the plain Trainer (no adapter is added here).
            # Every fold and author budget writes to the same output directory, so
            # checkpoints left there by earlier runs remain present while this run saves.

            training_args = TrainingArguments(
                learning_rate               = _LEARNING_RATE_,
                num_train_epochs            = _EPOCHS_[task_name],
                per_device_train_batch_size = _BATCH_SIZE_,
                per_device_eval_batch_size  = _BATCH_SIZE_,
                output_dir                  = _OUTPUT_DIR_ + '/' + task_name,
                save_total_limit            = 5,
                overwrite_output_dir        = True,
                remove_unused_columns       = False,
                evaluation_strategy         = 'epoch',
                logging_strategy            = 'epoch',
                save_strategy               = 'epoch',
                metric_for_best_model       = 'eval_acc',
                load_best_model_at_end      = True,
            )

            # Stop once 'eval_acc' has failed to improve by more than 0.0001
            # for 2 consecutive evaluations.
            trainer = Trainer(
                model           = models[task_name],
                args            = training_args,
                train_dataset   = Train,
                eval_dataset    = Val,
                compute_metrics = compute_accuracy,
                callbacks       = [EarlyStoppingCallback(early_stopping_patience = 2, early_stopping_threshold = 0.0001)]
            )
            # NOTE(review): writes a private TrainingArguments attribute to force the
            # GPU count used by the trainer; confirm this is still required.
            trainer.args._n_gpu = _NO_GPUS_

            trainer.train()

            # TEST MODEL ------------------------------------

            results = trainer.predict(task_test)
            metrics = compute_test_metrics(baseTest, results.predictions, task_name)

            acc.append(metrics['accuracy'])
            f1s.append(metrics['f1-score'])

        acc = np.array(acc)
        f1s = np.array(f1s)

        # [mean, std] over the folds for each metric.
        FewShot_Results[num] = {'accuracy': [acc.mean(), acc.std()], 'f1-score': [f1s.mean(), f1s.std()]}
        print(f"Results with {num} authors per label: ", FewShot_Results[num])

Working with 8 authors per label ... 
Train,Val split number 1 of 5


Some weights of the model checkpoint at pysentimiento/robertuito-base-cased were not used when initializing RobertaForSequenceClassification: ['lm_head.dense.weight', 'lm_head.bias', 'lm_head.layer_norm.weight', 'lm_head.layer_norm.bias', 'lm_head.dense.bias']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RobertaForSequenceClassification were not initialized from the model checkpoint at pysentimiento/robertuito-base-cased and are newly initialized: ['classifier.out_proj.weight', 'classifier.dense.weight', 'classifier.dense.bi

Epoch,Training Loss,Validation Loss,Acc
1,0.6761,0.699052,0.507619
2,0.6223,0.697157,0.526071
3,0.5833,0.696875,0.536012
4,0.529,0.700067,0.541012
5,0.4821,0.707808,0.540893
6,0.4286,0.718779,0.543214
7,0.3786,0.731943,0.544107
8,0.3483,0.74785,0.544167
9,0.309,0.765231,0.541845


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-5
Configuration saved in adapter_checkPoints/gender/checkpoint-5/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-5/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-10] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-20] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-15
Configuration saved in adapter_checkPoints/gender/checkpoint-15/config.

acc: 0.57: 100%|███████████████████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 142.62it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.7129,0.686068,0.546726
2,0.647,0.678914,0.572679
3,0.6107,0.673023,0.586607
4,0.5906,0.668605,0.595714
5,0.554,0.665147,0.601071
6,0.515,0.662452,0.606429
7,0.4926,0.660634,0.609881
8,0.4732,0.660187,0.61119
9,0.4386,0.661424,0.610714
10,0.4173,0.660498,0.613214


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-5
Configuration saved in adapter_checkPoints/gender/checkpoint-5/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-5/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-25] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-30] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-15
Configuration saved in adapter_checkPoints/gender/checkpoint-15/config.

***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-65
Configuration saved in adapter_checkPoints/gender/checkpoint-65/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-65/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-40] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-70
Configuration saved in adapter_checkPoints/gender/checkpoint-70/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-70/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-45] due to args.save_total_limit


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from adapter_checkPoints/gender/checkpoint-60 (score: 0.6142857142857143).
***** Running Prediction ***

acc: 0.6742857142857143: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 141.12it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.7064,0.68244,0.5625
2,0.6392,0.671467,0.595119
3,0.6006,0.662092,0.615357
4,0.5579,0.655118,0.624762
5,0.517,0.649915,0.631488
6,0.4926,0.645817,0.636548
7,0.4567,0.641993,0.640536
8,0.4272,0.639628,0.642738
9,0.4,0.639295,0.641488
10,0.3778,0.638436,0.643036


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-5
Configuration saved in adapter_checkPoints/gender/checkpoint-5/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-5/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-50] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-55] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-15
Configuration saved in adapter_checkPoints/gender/checkpoint-15/config.

***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-65
Configuration saved in adapter_checkPoints/gender/checkpoint-65/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-65/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-40] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-70
Configuration saved in adapter_checkPoints/gender/checkpoint-70/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-70/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-45] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-75
Configuration saved in adapter_checkPoints/gender/checkpoint-75/conf

acc: 0.6610714285714285: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:20<00:00, 139.19it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.669,0.674633,0.585179
2,0.6082,0.664706,0.610476
3,0.5742,0.659438,0.619464
4,0.5357,0.657033,0.620714
5,0.4967,0.657665,0.618393
6,0.467,0.65776,0.620357


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-5
Configuration saved in adapter_checkPoints/gender/checkpoint-5/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-5/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-70] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-75] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-15
Configuration saved in adapter_checkPoints/gender/checkpoint-15/config.

acc: 0.655: 100%|██████████████████████████████████████████████████████████████████| 2800/2800 [00:20<00:00, 139.36it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6532,0.668472,0.601667
2,0.6111,0.658887,0.617619
3,0.5754,0.650002,0.630179
4,0.5186,0.643739,0.638869
5,0.4851,0.64046,0.640536
6,0.4525,0.638994,0.640357
7,0.4142,0.63797,0.64244
8,0.3937,0.63846,0.642738
9,0.3561,0.640098,0.644464
10,0.3372,0.639729,0.645893


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-5
Configuration saved in adapter_checkPoints/gender/checkpoint-5/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-5/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-10] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-15] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-15
Configuration saved in adapter_checkPoints/gender/checkpoint-15/config.

***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-65
Configuration saved in adapter_checkPoints/gender/checkpoint-65/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-65/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-40] due to args.save_total_limit


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from adapter_checkPoints/gender/checkpoint-55 (score: 0.6469047619047619).
***** Running Prediction *****
  Num examples = 56000
  Batch size = 64


acc: 0.6714285714285714: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:20<00:00, 138.43it/s]


Results with 8 authors per label:  {'accuracy': [0.6463571428571429, 0.038807741706089145], 'f1-score': [0.675614778161259, 0.05229066275650628]}
Working with 16 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6959,0.68341,0.552679
2,0.6215,0.66625,0.58744
3,0.5639,0.657527,0.610714
4,0.5136,0.662672,0.606726
5,0.4708,0.672755,0.606786


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-45] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-50] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/conf

acc: 0.6392857142857142: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:20<00:00, 134.67it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.7004,0.681026,0.553095
2,0.6136,0.66255,0.59631
3,0.5495,0.654685,0.61369
4,0.5005,0.653301,0.613274
5,0.4456,0.655705,0.616964
6,0.4045,0.664231,0.621369
7,0.3608,0.672209,0.61881
8,0.3272,0.686081,0.618571


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-30/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter

acc: 0.6785714285714286: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:21<00:00, 131.74it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6777,0.676555,0.57256
2,0.6054,0.652451,0.621786
3,0.5513,0.638769,0.64
4,0.4902,0.63206,0.642202
5,0.4433,0.629266,0.645476
6,0.4017,0.636041,0.644405
7,0.3569,0.638745,0.647024
8,0.3159,0.648327,0.648214
9,0.2808,0.65887,0.647381
10,0.2552,0.669372,0.646488


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-40] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-50] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/conf

acc: 0.6810714285714285: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:18<00:00, 147.61it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.7033,0.682389,0.567083
2,0.6241,0.662165,0.605714
3,0.5654,0.656514,0.606905
4,0.5166,0.65155,0.61625
5,0.4653,0.650754,0.625417
6,0.4141,0.659619,0.622619
7,0.3703,0.664133,0.628631
8,0.3268,0.678446,0.627083
9,0.2975,0.68504,0.634286
10,0.2596,0.700194,0.633095


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-60] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-70] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/conf

acc: 0.6853571428571429: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:18<00:00, 147.82it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6778,0.6762,0.582976
2,0.609,0.657082,0.615238
3,0.5603,0.644828,0.629286
4,0.4979,0.635279,0.639345
5,0.4514,0.631386,0.645179
6,0.4032,0.636126,0.643333
7,0.3595,0.638243,0.647381
8,0.3196,0.64703,0.645655
9,0.2898,0.6558,0.644464


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-10
Configuration saved in adapter_checkPoints/gender/checkpoint-10/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-10/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-70] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-80] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/conf

acc: 0.6682142857142858: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:18<00:00, 152.66it/s]


Results with 16 authors per label:  {'accuracy': [0.6705, 0.01659634825828275], 'f1-score': [0.6892745171156573, 0.02207377870412438]}
Working with 32 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6877,0.673765,0.57381
2,0.6067,0.659639,0.594643
3,0.5475,0.666789,0.589702
4,0.4897,0.680066,0.59125


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-50] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-60] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/conf

acc: 0.6621428571428571: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 147.11it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6687,0.659408,0.600238
2,0.5875,0.651759,0.616488
3,0.5239,0.655559,0.62381
4,0.4585,0.666596,0.629107
5,0.3946,0.704322,0.626369
6,0.341,0.732233,0.628274


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter

acc: 0.6807142857142857: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:18<00:00, 153.41it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6487,0.633959,0.655714
2,0.5685,0.623559,0.665119
3,0.5031,0.623642,0.665238
4,0.448,0.619589,0.673155
5,0.3816,0.659452,0.65875
6,0.3257,0.679911,0.657202


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-80] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
***** Ru

acc: 0.6842857142857143: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 146.32it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6487,0.650831,0.617857
2,0.5685,0.647267,0.632857
3,0.5031,0.651502,0.636964
4,0.448,0.650399,0.641369
5,0.3816,0.694828,0.635952
6,0.3257,0.719544,0.635357


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-60] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
Deleting

acc: 0.6842857142857143: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 145.30it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6487,0.638646,0.644643
2,0.5685,0.631308,0.654345
3,0.5031,0.63419,0.656071
4,0.448,0.6312,0.660714
5,0.3816,0.6757,0.651786
6,0.3257,0.702042,0.647738


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-20
Configuration saved in adapter_checkPoints/gender/checkpoint-20/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-20/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-80] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
***** Ru

acc: 0.6842857142857143: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:18<00:00, 148.69it/s]


Results with 32 authors per label:  {'accuracy': [0.679142857142857, 0.008611809641772302], 'f1-score': [0.6896027128017307, 0.006236413401855358]}
Working with 48 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6694,0.65344,0.60875
2,0.5664,0.671338,0.593929
3,0.4832,0.694248,0.596667


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-30/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-60] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-100] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-90
Configuration saved in adapter_checkPoints/gender/checkpoint-90/con

acc: 0.6542857142857142: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 144.72it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6499,0.660337,0.607321
2,0.565,0.660121,0.620536
3,0.4915,0.681453,0.616548
4,0.4283,0.707673,0.621726
5,0.3672,0.723056,0.628929
6,0.3173,0.75243,0.633869
7,0.2719,0.789026,0.631905
8,0.2246,0.850971,0.629167


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-30/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-90
Configuration saved in adapter_checkPoints/gender/checkpoint-90/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-90/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter

acc: 0.6882142857142857: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:18<00:00, 147.94it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6589,0.633269,0.654821
2,0.5597,0.613434,0.670714
3,0.4839,0.628318,0.664048
4,0.4109,0.648896,0.66369


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-30/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-120] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-150] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-90
Configuration saved in adapter_checkPoints/gender/checkpoint-90/co

acc: 0.68: 100%|███████████████████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 144.59it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6523,0.65304,0.631071
2,0.5579,0.645706,0.636429
3,0.4787,0.668099,0.634583
4,0.4152,0.693787,0.637024
5,0.3514,0.726987,0.636667
6,0.2949,0.762566,0.640298
7,0.2426,0.812519,0.637381
8,0.1969,0.883757,0.637262


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-30/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-90
Configuration saved in adapter_checkPoints/gender/checkpoint-90/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-90/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter

acc: 0.6946428571428571: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 146.05it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6589,0.633858,0.66006
2,0.5597,0.616724,0.675
3,0.4839,0.636408,0.668214
4,0.4109,0.662292,0.666131


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-30
Configuration saved in adapter_checkPoints/gender/checkpoint-30/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-30/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-120] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-60
Configuration saved in adapter_checkPoints/gender/checkpoint-60/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-60/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-150] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-90
Configuration saved in adapter_checkPoints/gender/checkpoint-90/co

acc: 0.68: 100%|███████████████████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 145.41it/s]


Results with 48 authors per label:  {'accuracy': [0.6794285714285715, 0.013722095990312377], 'f1-score': [0.6935243485276106, 0.025162403949095986]}
Working with 64 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6578,0.656426,0.59619
2,0.5547,0.670281,0.60119
3,0.4801,0.722978,0.59744
4,0.419,0.762094,0.59994


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-240] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-30] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-120
Configuration saved in adapter_checkPoints/gender/checkpoint-120/c

acc: 0.6225: 100%|█████████████████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 142.98it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6546,0.643228,0.622679
2,0.5652,0.639114,0.636964
3,0.4883,0.65525,0.639286
4,0.4118,0.697719,0.638452
5,0.3454,0.732488,0.639821
6,0.2947,0.779493,0.642143
7,0.2358,0.837255,0.64256
8,0.1908,0.899205,0.641786
9,0.1471,0.977406,0.640893


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-120
Configuration saved in adapter_checkPoints/gender/checkpoint-120/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-120/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adap

acc: 0.7089285714285715: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 141.80it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6558,0.618105,0.670774
2,0.5685,0.59958,0.679881
3,0.5003,0.602091,0.680476
4,0.4221,0.624915,0.674464
5,0.3511,0.665167,0.674524


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-200] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-240] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-120
Configuration saved in adapter_checkPoints/gender/checkpoint-120/

acc: 0.7107142857142857: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 143.45it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6558,0.64937,0.630952
2,0.5705,0.640664,0.636786
3,0.494,0.652628,0.64
4,0.4148,0.687382,0.634583
5,0.3529,0.730098,0.636905


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-120
Configuration saved in adapter_checkPoints/gender/checkpoint-120/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-120/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adap

acc: 0.6996428571428571: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 145.07it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6558,0.638516,0.645476
2,0.5705,0.625606,0.655476
3,0.494,0.632415,0.659702
4,0.4148,0.661333,0.651429
5,0.3529,0.702288,0.652738


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-40
Configuration saved in adapter_checkPoints/gender/checkpoint-40/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-40/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-120
Configuration saved in adapter_checkPoints/gender/checkpoint-120/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-120/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adap

acc: 0.6996428571428571: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 144.88it/s]


Results with 64 authors per label:  {'accuracy': [0.6882857142857143, 0.03321113656345916], 'f1-score': [0.6787820866714995, 0.048350822584644085]}
Working with 128 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6393,0.630892,0.633452
2,0.5501,0.635357,0.640714
3,0.4739,0.648297,0.646786
4,0.4006,0.683748,0.647857
5,0.3294,0.733024,0.64869
6,0.2607,0.790741,0.643869
7,0.208,0.865234,0.635298


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-240
Configuration saved in adapter_checkPoints/gender/checkpoint-240/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-240/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-40] due to args.save_total_limit
**

acc: 0.7164285714285714: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 146.84it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6314,0.647354,0.630238
2,0.5355,0.639391,0.648869
3,0.4611,0.658887,0.654583
4,0.3866,0.682248,0.659226
5,0.3154,0.738015,0.658631
6,0.2532,0.798669,0.65881


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-240] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-320] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-240
Configuration saved in adapter_checkPoints/gender/checkpoint-2

acc: 0.7360714285714286: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 145.34it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6127,0.600431,0.68506
2,0.514,0.596502,0.687202
3,0.4392,0.62,0.68881
4,0.3619,0.64807,0.688571
5,0.2913,0.690581,0.68375


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-160] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-240] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-240
Configuration saved in adapter_checkPoints/gender/checkpoint-2

acc: 0.7367857142857143: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 146.60it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.625,0.639465,0.647679
2,0.5286,0.630644,0.663929
3,0.4526,0.65746,0.664821
4,0.3786,0.68347,0.663512
5,0.3111,0.746672,0.662857


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-240
Configuration saved in adapter_checkPoints/gender/checkpoint-240/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-240/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to a

acc: 0.7271428571428571: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 145.93it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.625,0.620442,0.661726
2,0.5286,0.605438,0.674345
3,0.4526,0.624865,0.674464
4,0.3786,0.648827,0.673333
5,0.3111,0.701599,0.678155
6,0.2391,0.764512,0.676786
7,0.1825,0.821654,0.677143


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-80
Configuration saved in adapter_checkPoints/gender/checkpoint-80/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-80/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-240
Configuration saved in adapter_checkPoints/gender/checkpoint-240/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-240/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to a

acc: 0.7296428571428571: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:19<00:00, 144.06it/s]


Results with 128 authors per label:  {'accuracy': [0.7292142857142858, 0.007379646581881108], 'f1-score': [0.7342845402829002, 0.013718943601915282]}
Working with 256 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6254,0.608448,0.661726
2,0.5321,0.596824,0.679702
3,0.4465,0.61803,0.67994
4,0.3619,0.654262,0.681964
5,0.2822,0.7027,0.684107
6,0.2169,0.785139,0.682798
7,0.1576,0.908229,0.687024
8,0.1116,1.020597,0.67244
9,0.0797,1.156024,0.678929


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-240] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-480
Configuration saved in adapter_checkPoints/gender/checkpoint-480/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-480/pytorch_model.bi

acc: 0.8021428571428572: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 160.07it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6133,0.604408,0.666607
2,0.513,0.606181,0.678571
3,0.4317,0.635277,0.684345
4,0.3538,0.685791,0.689167
5,0.2754,0.739154,0.686786
6,0.211,0.810942,0.691012
7,0.1648,0.906659,0.687083
8,0.1222,0.993968,0.686488


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-800] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-960] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-480
Configuration saved in adapter_checkPoints/gender/checkpoin

acc: 0.7867857142857143: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:16<00:00, 164.82it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6095,0.580996,0.688929
2,0.5054,0.576294,0.699107
3,0.424,0.604686,0.699345
4,0.3392,0.646093,0.701964
5,0.2646,0.716445,0.695357
6,0.1987,0.797181,0.699821


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-640] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-800] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-480
Configuration saved in adapter_checkPoints/gender/checkpoin

acc: 0.7696428571428572: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 156.73it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6018,0.589458,0.67875
2,0.5008,0.592655,0.687202
3,0.4149,0.617783,0.695
4,0.3311,0.67553,0.692262
5,0.2501,0.738575,0.692917


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-320] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-480] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-480
Configuration saved in adapter_checkPoints/gender/checkpoin

acc: 0.775: 100%|██████████████████████████████████████████████████████████████████| 2800/2800 [00:16<00:00, 166.77it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6112,0.575416,0.690893
2,0.5116,0.561788,0.707262
3,0.428,0.578867,0.70869
4,0.3427,0.615145,0.708274
5,0.266,0.674154,0.703512


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-160
Configuration saved in adapter_checkPoints/gender/checkpoint-160/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-160/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-480
Configuration saved in adapter_checkPoints/gender/checkpoint-480/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-480/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint t

acc: 0.7703571428571429: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 162.37it/s]


Results with 256 authors per label:  {'accuracy': [0.7807857142857142, 0.012316821084705786], 'f1-score': [0.775970202717284, 0.014919221734025953]}
Working with 512 authors per label ... 
Train,Val split number 1 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.596,0.590273,0.68506
2,0.491,0.579206,0.700298
3,0.4064,0.61387,0.707024
4,0.3246,0.686476,0.700655
5,0.2513,0.763468,0.702381


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-640
Configuration saved in adapter_checkPoints/gender/checkpoint-640/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-640/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-960
Configuration saved in adapter_checkPoints/gender/checkpoint-960/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-960/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-160] due to args.save_total_limi

acc: 0.8207142857142857: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 161.37it/s]


Train,Val split number 2 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.5942,0.599927,0.680536
2,0.4896,0.597196,0.696726
3,0.3987,0.665928,0.693452
4,0.3216,0.693193,0.698214
5,0.2448,0.776772,0.697083
6,0.1852,0.868872,0.699226
7,0.1335,0.994927,0.694405
8,0.0971,1.179136,0.690417


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-640] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-640
Configuration saved in adapter_checkPoints/gender/checkpoint-640/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-640/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-800] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-960
Configuration saved in adapter_checkPoints/gender/checkpoin

acc: 0.8114285714285714: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 159.90it/s]


Train,Val split number 3 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.5954,0.574063,0.693333
2,0.4888,0.591658,0.692381
3,0.4003,0.621338,0.697024
4,0.3177,0.679599,0.686786
5,0.2477,0.739347,0.701429
6,0.1827,0.889384,0.682976
7,0.1315,0.98505,0.69619


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-640
Configuration saved in adapter_checkPoints/gender/checkpoint-640/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-640/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-960
Configuration saved in adapter_checkPoints/gender/checkpoint-960/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-960/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-320] due to args.save_total_limi

acc: 0.8153571428571429: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 160.18it/s]


Train,Val split number 4 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.6003,0.588046,0.68256
2,0.4957,0.606565,0.688155
3,0.4034,0.643012,0.691429
4,0.3236,0.70405,0.680774
5,0.2541,0.787207,0.687262


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-960] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-640
Configuration saved in adapter_checkPoints/gender/checkpoint-640/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-640/pytorch_model.bin
Deleting older checkpoint [adapter_checkPoints/gender/checkpoint-1280] due to args.save_total_limit
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-960
Configuration saved in adapter_checkPoints/gender/checkpoi

acc: 0.7989285714285714: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 162.89it/s]


Train,Val split number 5 of 5


loading configuration file https://huggingface.co/pysentimiento/robertuito-base-cased/resolve/main/config.json from cache at /001/usuarios/isaac.bribiesca/.cache/huggingface/transformers/3f85c0ee804baf604258892a88dd52cdf051d2418a511dcab7cab99a85a3a1b3.4cce50d5a926bf18fe43f2ea8d4596b505e97a64e6e700e993def66b06f1c83b
Model config RobertaConfig {
  "_name_or_path": "pysentimiento/robertuito-base-cased",
  "architectures": [
    "RobertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 130,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.21

Epoch,Training Loss,Validation Loss,Acc
1,0.5989,0.560749,0.70625
2,0.4969,0.578273,0.706964
3,0.4054,0.59835,0.713333
4,0.3258,0.654239,0.70244
5,0.2537,0.72339,0.710238


***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-320
Configuration saved in adapter_checkPoints/gender/checkpoint-320/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-320/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-640
Configuration saved in adapter_checkPoints/gender/checkpoint-640/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-640/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint to adapter_checkPoints/gender/checkpoint-960
Configuration saved in adapter_checkPoints/gender/checkpoint-960/config.json
Model weights saved in adapter_checkPoints/gender/checkpoint-960/pytorch_model.bin
***** Running Evaluation *****
  Num examples = 16800
  Batch size = 64
Saving model checkpoint t

acc: 0.8028571428571428: 100%|█████████████████████████████████████████████████████| 2800/2800 [00:17<00:00, 163.03it/s]

Results with 512 authors per label:  {'accuracy': [0.8098571428571427, 0.007987873462253879], 'f1-score': [0.8000596537338568, 0.013255013701296225]}





In [11]:
# Display the accumulated few-shot results as the cell output.
# Keys are the number of training authors per label (8 ... 512); each entry
# holds 'accuracy' and 'f1-score' as two-element lists.
# NOTE(review): the pairs look like [mean, std] over the cross-validation
# splits (the 512-author accuracy matches the per-split values logged above)
# -- confirm against the cell that fills this dict.
FewShot_Results

{8: {'accuracy': [0.6463571428571429, 0.038807741706089145],
  'f1-score': [0.675614778161259, 0.05229066275650628]},
 16: {'accuracy': [0.6705, 0.01659634825828275],
  'f1-score': [0.6892745171156573, 0.02207377870412438]},
 32: {'accuracy': [0.679142857142857, 0.008611809641772302],
  'f1-score': [0.6896027128017307, 0.006236413401855358]},
 48: {'accuracy': [0.6794285714285715, 0.013722095990312377],
  'f1-score': [0.6935243485276106, 0.025162403949095986]},
 64: {'accuracy': [0.6882857142857143, 0.03321113656345916],
  'f1-score': [0.6787820866714995, 0.048350822584644085]},
 128: {'accuracy': [0.7292142857142858, 0.007379646581881108],
  'f1-score': [0.7342845402829002, 0.013718943601915282]},
 256: {'accuracy': [0.7807857142857142, 0.012316821084705786],
  'f1-score': [0.775970202717284, 0.014919221734025953]},
 512: {'accuracy': [0.8098571428571427, 0.007987873462253879],
  'f1-score': [0.8000596537338568, 0.013255013701296225]}}