# Abstractive summaries - Train DistilBART on TWEETSUMM dataset, continued

In [1]:
!ls /kaggle/input/

bart-res-p1-2409  bertdata2207	gptdata


In [2]:
!cp -r /kaggle/input/bart-res-p1-2409/* /kaggle/working

In [3]:
from huggingface_hub import login
import pandas as pd
import numpy as np
import os, time, datetime, shutil

from datasets import Dataset, DatasetDict

from transformers import DataCollatorForSeq2Seq, AutoTokenizer, set_seed
from transformers import AutoModelForSeq2SeqLM, Seq2SeqTrainingArguments, Seq2SeqTrainer
from transformers import TrainerCallback, TrainingArguments, TrainerState, TrainerControl

import wandb

In [4]:
!pip freeze > requirements_bart.txt

  pid, fd = os.forkpty()


In [5]:
def get_current_time(underscore=False):
    return datetime.datetime.now().strftime("%d%m-%H%M" if not underscore else "%d%m_%H%M")

In [6]:
run_name = f"bart-abs-{get_current_time()}"
models_dir = os.path.join(os.getcwd(), 'models')
os.makedirs(models_dir, exist_ok=True)
results_dir = os.path.join(os.getcwd(), 'results', 'bart')
os.makedirs(results_dir, exist_ok=True)
ds_dir = os.path.join(os.getcwd(), 'data')
print(run_name)

bart-abs-2409-1947


In [7]:
try:
    HF_TOKEN =  os.environ['HF_TOKEN']
except:
    HF_TOKEN = ""

if 'google.colab' in str(get_ipython()):
    print("Running on Colab")
    from google.colab import drive, userdata
    drive.mount('/content/drive')
    HF_TOKEN = userdata.get('HF_TOKEN')
elif os.environ.get('KAGGLE_KERNEL_RUN_TYPE') != None:
    ds_dir = '/kaggle/input/bertdata2207/'
    from kaggle_secrets import UserSecretsClient
    print("Running on Kaggle")
    user_secrets = UserSecretsClient()
    HF_TOKEN = user_secrets.get_secret("HF_TOKEN")
    WANDB_API_KEY = user_secrets.get_secret("WANDB_API_KEY")
    os.environ['WANDB_API_KEY'] = WANDB_API_KEY
    os.makedirs(os.path.join(os.getcwd(), "results"), exist_ok=True)
    os.makedirs(os.path.join(os.getcwd(), 'results', 'bart'), exist_ok=True)


Running on Kaggle


In [8]:
set_seed(17)

In [9]:
os.environ["WANDB_PROJECT"] = f"aiml-thesis-train-{run_name}"
os.environ["WANDB_WATCH"] = "false"
wandb.init(settings=wandb.Settings(start_method="thread"), id=run_name)

[34m[1mwandb[0m: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
[34m[1mwandb[0m: Currently logged in as: [33mdawidk5[0m ([33mdawidk5ul[0m). Use [1m`wandb login --relogin`[0m to force relogin
[34m[1mwandb[0m: Tracking run with wandb version 0.18.1
[34m[1mwandb[0m: Run data is saved locally in [35m[1m/kaggle/working/wandb/run-20240924_194754-bart-abs-2409-1947[0m
[34m[1mwandb[0m: Run [1m`wandb offline`[0m to turn off syncing.
[34m[1mwandb[0m: Syncing run [33mbart-abs-2409-1947[0m
[34m[1mwandb[0m: ⭐️ View project at [34m[4mhttps://wandb.ai/dawidk5ul/aiml-thesis-train-bart-abs-2409-1947[0m
[34m[1mwandb[0m: 🚀 View run at [34m[4mhttps://wandb.ai/dawidk5ul/aiml-thesis-train-bart-abs-2409-1947/runs/bart-abs-2409-1947[0m


In [10]:
login(token=HF_TOKEN)

The token has not been saved to the git credentials helper. Pass `add_to_git_credential=True` in this function directly or `--add-to-git-credential` if using via `huggingface-cli` if you want to set the git credential as well.
Token is valid (permission: write).
Your token has been saved to /root/.cache/huggingface/token
Login successful


## Load data

In [11]:
print(ds_dir)

/kaggle/input/bertdata2207/


In [12]:
checkpoint_bart = "sshleifer/distilbart-xsum-12-6"

In [13]:
def csv_to_pandas(file_name, ds_dir, drop_conv_id=True):
    df = pd.read_csv(os.path.join(ds_dir, file_name), names=['conv_id', 'dialogue', 'summary'], encoding='utf-8', dtype={'conv_id': 'string', 'dialogue': 'string', 'summary': 'string'})
    df = df.convert_dtypes()
    if drop_conv_id:
        df.drop(columns=['conv_id'], inplace=True)
    df.reset_index(drop=True, inplace=True)
    return df

In [14]:
train_df_temp = csv_to_pandas("dials_abs_2607_1312_train_spc.csv", ds_dir)
val_df_temp = csv_to_pandas("dials_abs_2607_1312_valid_spc.csv", ds_dir)
test_df = csv_to_pandas("dials_abs_2607_1312_test_spc.csv", ds_dir, drop_conv_id=False)

print(train_df_temp.dtypes)
print(train_df_temp.head(), len(train_df_temp))

dialogue    string[python]
summary     string[python]
dtype: object
                                            dialogue  \
0  Customer: So neither my iPhone nor my Apple Wa...   
1  Customer: @115850 hi team! i m planning to get...   
2  Customer: @AskAmex Where do I write to address...   
3  Customer: @AmazonHelp @115821 Wow, expected 4 ...   
4  Customer: @GWRHelp I'd rather you spent some t...   

                                             summary  
0  Customer enquired about his Iphone and Apple w...  
1  Customer is eager to know about the replacemen...  
2  Signed up for an AmexCard with Delta but it di...  
3  The customer have a problem. The agent is very...  
4  Customer cannot purchase a train ticket on the...   867


In [15]:
tweetsumm_abs = DatasetDict(
    {
        'train': Dataset.from_pandas(train_df_temp),
        'validation': Dataset.from_pandas(val_df_temp),
        'test': Dataset.from_pandas(test_df)
    }
)

In [16]:
tokenizer = AutoTokenizer.from_pretrained(checkpoint_bart)
print(tokenizer)

tokenizer_config.json:   0%|          | 0.00/26.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/1.59k [00:00<?, ?B/s]

vocab.json:   0%|          | 0.00/899k [00:00<?, ?B/s]

merges.txt:   0%|          | 0.00/456k [00:00<?, ?B/s]

BartTokenizerFast(name_or_path='sshleifer/distilbart-xsum-12-6', vocab_size=50265, model_max_length=1024, is_fast=True, padding_side='right', truncation_side='right', special_tokens={'bos_token': '<s>', 'eos_token': '</s>', 'unk_token': '<unk>', 'sep_token': '</s>', 'pad_token': '<pad>', 'cls_token': '<s>', 'mask_token': '<mask>'}, clean_up_tokenization_spaces=True),  added_tokens_decoder={
	0: AddedToken("<s>", rstrip=False, lstrip=False, single_word=False, normalized=True, special=True),
	1: AddedToken("<pad>", rstrip=False, lstrip=False, single_word=False, normalized=True, special=True),
	2: AddedToken("</s>", rstrip=False, lstrip=False, single_word=False, normalized=True, special=True),
	3: AddedToken("<unk>", rstrip=False, lstrip=False, single_word=False, normalized=True, special=True),
	50264: AddedToken("<mask>", rstrip=False, lstrip=True, single_word=False, normalized=True, special=True),
}




In [17]:
# Source: https://huggingface.co/docs/transformers/en/tasks/summarization

def preprocess_function(examples):
    prefix = "summarize: "
    inputs = [str(prefix) + str(dial) for dial in examples["dialogue"]]
    model_inputs = tokenizer(inputs, max_length=512, truncation=True) # same params as tweetsumm paper
    labels = tokenizer(text_target=examples["summary"], max_length=80, truncation=True)
    model_inputs["labels"] = labels["input_ids"]
    return model_inputs

In [18]:
tokenized_tweetsumm_abs = tweetsumm_abs.map(preprocess_function, batched=True, remove_columns=['dialogue','summary'])
print(tokenized_tweetsumm_abs["train"][1])

Map:   0%|          | 0/867 [00:00<?, ? examples/s]

Map:   0%|          | 0/110 [00:00<?, ? examples/s]

Map:   0%|          | 0/109 [00:00<?, ? examples/s]

{'input_ids': [0, 18581, 3916, 2072, 35, 19458, 35, 787, 1225, 4432, 1096, 20280, 165, 328, 939, 475, 1884, 7, 120, 1257, 1754, 510, 20529, 27785, 24, 924, 15, 5, 998, 24, 34, 158, 360, 5010, 21784, 6, 64, 1717, 3922, 162, 99, 16, 24, 17487, 50118, 45443, 35, 787, 2481, 3897, 2036, 166, 348, 10, 158, 7033, 5010, 714, 114, 5, 6880, 47, 829, 16, 5009, 50, 31559, 4, 37249, 10237, 50118, 44799, 35, 787, 25146, 28780, 5148, 27785, 125, 99, 114, 939, 399, 17, 27, 90, 101, 5, 1152, 8, 236, 7, 671, 24, 50118, 45443, 35, 787, 2481, 3897, 2036, 166, 1979, 75, 28, 441, 7, 3264, 5, 23312, 2886, 4, 286, 55, 335, 15, 1830, 2886, 714, 4, 17161, 352, 3753, 15, 5, 3104, 1373, 259, 35, 1205, 640, 90, 4, 876, 73, 571, 40969, 9380, 530, 4154, 510, 975, 4, 3166, 19954, 877, 110, 2969, 4, 50118, 44799, 35, 787, 25146, 28780, 5148, 2446, 27785, 125, 209, 32, 5567, 15797, 98, 473, 24, 1266, 276, 714, 3253, 13, 209, 25, 157, 50118, 45443, 35, 787, 2481, 3897, 2036, 3216, 6, 30845, 73, 5567, 15797, 32, 45, 4973

## Setup Training Evaluation

In [19]:
!pip install -U nltk

  pid, fd = os.forkpty()
huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Collecting nltk
  Downloading nltk-3.9.1-py3-none-any.whl.metadata (2.9 kB)
Downloading nltk-3.9.1-py3-none-any.whl (1.5 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m1.5/1.5 MB[0m [31m23.9 MB/s[0m eta [36m0:00:00[0m
[?25hInstalling collected packages: nltk
  Attempting uninstall: nltk
    Found existing installation: nltk 3.2.4
    Uninstalling nltk-3.2.4:
      Successfully uninstalled nltk-3.2.4
[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.
preprocessing 0.1.13 requires nltk==3.2.4, but you have nltk 3.9.1 which is incompatible.[0m[31m
[0mSuccessfully installed nltk-3.9.1


In [20]:
!pip install evaluate pyrouge rouge_score bert_score meteor

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Collecting evaluate
  Downloading evaluate-0.4.3-py3-none-any.whl.metadata (9.2 kB)
Collecting pyrouge
  Downloading pyrouge-0.1.3.tar.gz (60 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m60.5/60.5 kB[0m [31m2.5 MB/s[0m eta [36m0:00:00[0m
[?25h  Preparing metadata (setup.py) ... [?25l- done
[?25hCollecting rouge_score
  Downloading rouge_score-0.1.2.tar.gz (17 kB)
  Preparing metadata (setup.py) ... [?25l- done
[?25hCollecting bert_score
  Downloading bert_score-0.3.13-py3-none-any.whl.metadata (15 kB)
Collecting meteor
  Downloading meteor-2.0.16-py3-none-any.whl.metadata (8.3 kB)
Collecting bgzip<0.6.0,>=0.5.0 (from meteor)
  Downloading bgzip-0.5.0.tar.gz (100 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m100.2/100.2 kB[0m [31m5.1 MB/s[0m eta [36m0:00:00[0m
[?25h  Preparing metadata (setup.py) ... [?25l- done
[?25hCollecting biom-format<3.0.0,>=2.1.15 (from meteor)
  Downloading biom-format-2.1.16.t

In [21]:
import evaluate, nltk, csv
rouge = evaluate.load("rouge")
meteor = evaluate.load("meteor")
bertscore = evaluate.load("bertscore")

nltk.download('punkt_tab')

Downloading builder script:   0%|          | 0.00/6.27k [00:00<?, ?B/s]

Downloading builder script:   0%|          | 0.00/7.02k [00:00<?, ?B/s]

[nltk_data] Downloading package wordnet to /usr/share/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!
[nltk_data] Downloading package punkt_tab to /usr/share/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt_tab.zip.
[nltk_data] Downloading package omw-1.4 to /usr/share/nltk_data...


Downloading builder script:   0%|          | 0.00/7.95k [00:00<?, ?B/s]

[nltk_data] Downloading package punkt_tab to /usr/share/nltk_data...
[nltk_data]   Package punkt_tab is already up-to-date!


True

In [22]:
# Main source, official HUggingFace documentation: https://huggingface.co/docs/transformers/tasks/summarization
def compute_metrics_abs(eval_pred):
    predictions, labels = eval_pred
    # Extra line added to address an overflow: https://github.com/huggingface/transformers/issues/22634
    predictions = np.where(predictions != -100, predictions, tokenizer.pad_token_id)
    decoded_preds = tokenizer.batch_decode(predictions, skip_special_tokens=True)
    labels = np.where(labels != -100, labels, tokenizer.pad_token_id)
    decoded_labels = tokenizer.batch_decode(labels, skip_special_tokens=True)
    prediction_lens = [np.count_nonzero(pred != tokenizer.pad_token_id) for pred in predictions]

    rouge_scores = rouge.compute(predictions=decoded_preds, references=decoded_labels, use_stemmer=True, use_aggregator=True)
    bert_scores = bertscore.compute(predictions=decoded_preds, references=decoded_labels, lang="en")
    bert_scores.pop('hashcode')
    result = {
      **{f"rouge/{k}": round(v, 4) for k,v in rouge_scores.items()},
      **{f"bertscore/bertscore-{k}": round(np.mean(v), 4) for k,v in bert_scores.items()},
      'meteor': round(meteor.compute(predictions=decoded_preds, references=decoded_labels)['meteor'], 4),
    }
   
    result["gen_len"] = np.mean(prediction_lens)
    return result


## Train and Evaluate

In [23]:
model = AutoModelForSeq2SeqLM.from_pretrained(checkpoint_bart)

pytorch_model.bin:   0%|          | 0.00/611M [00:00<?, ?B/s]

In [24]:
data_collator = DataCollatorForSeq2Seq(tokenizer=tokenizer, model=model)

In [25]:
EXPERIMENT_PARAMS = []
BASE_PARAMS = {'lr':3e-5, 'batch_size':4, 'epochs': 6}
EXPERIMENT_PARAMS.append(BASE_PARAMS)

In [26]:
LEARN_RATES = (3e-5, 3e-4, 3e-6)
BATCH_SIZES = (4, 2, 8)
EPOCHS = (6,10)

for lr in LEARN_RATES:
    for batch_size in BATCH_SIZES:
        for epoch in EPOCHS:
            if lr == BASE_PARAMS['lr'] and batch_size == BASE_PARAMS['batch_size'] and epoch == BASE_PARAMS['epochs']:
                continue
            experiment = {'lr':lr, 'batch_size':batch_size, 'epochs': epoch}
            EXPERIMENT_PARAMS.append(experiment)

In [27]:
os.listdir(results_dir)

['log_bart_abs_2409_0144_lr_3e_05_bs_4_maxep_10.csv',
 'test_metrics_bart_abs_2409_0144_lr_3e_05_bs_4_maxep_6_s1085_bart.csv',
 'test_metrics_bart_abs_2409_0144_lr_3e_05_bs_4_maxep_10_s1302_bart.csv',
 'test_preds_bart_abs_2409_0144_lr_3e_05_bs_4_maxep_6_s1085_bart.csv',
 'log_bart_abs_2409_0144_lr_3e_05_bs_2_maxep_6.csv',
 'test_preds_bart_abs_2409_0144_lr_3e_05_bs_4_maxep_10_s1302_bart.csv',
 'test_preds_bart_abs_2409_0144_lr_3e_05_bs_2_maxep_6_s2604_bart.csv',
 'log_bart_abs_2409_0144_lr_3e_05_bs_4_maxep_6.csv',
 'test_metrics_bart_abs_2409_0144_lr_3e_05_bs_2_maxep_6_s2604_bart.csv']

In [28]:
FINISHED_EXPERIMENTS = []
for exp in EXPERIMENT_PARAMS:
    exp_name = f"lr_{exp['lr']}_bs-{exp['batch_size']}_maxep_{exp['epochs']}".replace('-','_')
    files_found = sum([(exp_name in filename) for filename in os.listdir(results_dir)])
    if files_found == 3:
        # Experiment finished
        FINISHED_EXPERIMENTS.append(exp)
EXPERIMENT_PARAMS = [exp for exp in EXPERIMENT_PARAMS if exp not in FINISHED_EXPERIMENTS]
print("Experiments left:", len(EXPERIMENT_PARAMS))

Experiments left: 15


In [29]:
def run_post_training(split, test_details, test_df_temp: pd.DataFrame, tokenizer, experiment, run_name_model, epoch, results_dir):
    # First line added due to label error, see 
    predictions = np.where(test_details.predictions != -100, test_details.predictions, tokenizer.pad_token_id)
    preds = tokenizer.batch_decode(predictions, skip_special_tokens=True)
    test_df_temp['response'] = preds
    exp_res = {**experiment, **(test_details.metrics)}
    test_metrics_df = pd.DataFrame([exp_res])
    test_df_temp = test_df_temp.convert_dtypes()
    test_metrics_df = test_metrics_df.convert_dtypes()
    wandb.log({run_name_model: test_details.metrics})
    preds_name = f"{split}_preds_{run_name_model.replace('-','_')}_s{epoch}_bart.csv"
    metrics_name =  f"{split}_metrics_{run_name_model.replace('-','_')}_s{epoch}_bart.csv"
    test_df_temp.to_csv(os.path.join(results_dir, preds_name), index=False, header=False, encoding='utf-8', quoting=csv.QUOTE_ALL)
    test_metrics_df.to_csv(os.path.join(results_dir, metrics_name), index=False, header=True, encoding='utf-8', quoting=csv.QUOTE_ALL)

In [30]:
class ExtraCallback(TrainerCallback):        
    def on_train_end(self, args, state, control, **kwargs):
        # Save and upload CSVs
        super().on_train_end(args, state, control, **kwargs)
        df = pd.DataFrame(state.log_history)
        df = df.convert_dtypes()
        df = df.groupby(['epoch'], as_index=False).sum()
        df.to_csv(os.path.join(results_dir, "log_" + args.run_name.replace('-','_') + ".csv"), header=True, index=False)

In [31]:
for count, exp in enumerate(EXPERIMENT_PARAMS):
    run_name_model = f"{run_name}-lr-{exp['lr']}-bs-{exp['batch_size']}-maxep-{exp['epochs']}"
    print("=== Starting experiment", count, f"on {get_current_time()}:", run_name_model, "training")
    wandb.run.name = run_name_model
    wandb.run.save()

    training_args = Seq2SeqTrainingArguments(
        output_dir=os.path.join(models_dir, run_name_model),
        eval_strategy="epoch",
        logging_strategy="epoch",
        save_only_model=True,
        learning_rate=exp['lr'],
        per_device_train_batch_size=exp['batch_size'],
        per_device_eval_batch_size=exp['batch_size'],
        weight_decay=0.1,
        save_strategy="epoch",
        save_total_limit=1,
        load_best_model_at_end=True,
        metric_for_best_model="eval_rouge/rougeL",
        greater_is_better=True,
        num_train_epochs=exp['epochs'],
        predict_with_generate=True,
        fp16=True,
        generation_max_length=80,
        push_to_hub=False,
        report_to="wandb",
        run_name=run_name_model,
    )
    trainer = Seq2SeqTrainer(
        model=model,
        args=training_args,
        train_dataset=tokenized_tweetsumm_abs["train"], # .select(range(0,50)),
        eval_dataset=tokenized_tweetsumm_abs["validation"], # .select(range(0,10)),
        tokenizer=tokenizer,
        data_collator=data_collator,
        compute_metrics=compute_metrics_abs,
    )
    trainer.add_callback(ExtraCallback)
    training_start = time.time()
    trainer.train()
    training_end = time.time()
    print(f"Finished experiment {count}: {run_name_model} - time it took for training:", str(datetime.timedelta(seconds=(training_end-training_start))))
    test_details = trainer.predict(tokenized_tweetsumm_abs['test'], metric_key_prefix='test')
    run_post_training('test', test_details, test_df, tokenizer, exp, run_name_model, trainer.state.best_model_checkpoint.split('-')[-1], results_dir)
    trainer.push_to_hub()
    shutil.rmtree(models_dir)
    os.makedirs(models_dir)



=== Starting experiment 0 on 2409-1949: bart-abs-2409-1947-lr-3e-05-bs-2-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,2.3299,2.199738,0.4484,0.2127,0.3842,0.3856,0.8939,0.8904,0.892,0.4107,38.427273
2,1.6174,2.058076,0.4617,0.2158,0.3919,0.393,0.8972,0.8907,0.8938,0.4049,36.054545
3,1.1854,2.188786,0.4631,0.2153,0.3893,0.3914,0.9,0.891,0.8953,0.4044,35.827273
4,0.8568,2.377647,0.4518,0.201,0.3822,0.3839,0.8973,0.8895,0.8932,0.3907,34.763636
5,0.6056,2.646757,0.4731,0.2207,0.4031,0.4036,0.8974,0.8946,0.8959,0.4173,37.581818
6,0.4235,2.922561,0.4816,0.2258,0.4055,0.4064,0.8989,0.8955,0.897,0.4317,36.890909
7,0.2995,3.193845,0.4541,0.1989,0.3839,0.3843,0.8941,0.8916,0.8927,0.4071,37.009091
8,0.2079,3.417814,0.4684,0.2094,0.3926,0.3931,0.8941,0.8942,0.894,0.4177,39.454545
9,0.1527,3.534687,0.4716,0.2151,0.3989,0.4009,0.8937,0.8942,0.8938,0.4277,39.590909
10,0.1203,3.654172,0.4733,0.2228,0.409,0.4103,0.8957,0.8945,0.8949,0.4257,38.072727


tokenizer_config.json:   0%|          | 0.00/25.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/482 [00:00<?, ?B/s]

vocab.json:   0%|          | 0.00/899k [00:00<?, ?B/s]

merges.txt:   0%|          | 0.00/456k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/1.36M [00:00<?, ?B/s]



model.safetensors:   0%|          | 0.00/1.42G [00:00<?, ?B/s]

Some weights of RobertaModel were not initialized from the model checkpoint at roberta-large and are newly initialized: ['roberta.pooler.dense.bias', 'roberta.pooler.dense.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repea

Finished experiment 0: bart-abs-2409-1947-lr-3e-05-bs-2-maxep-10 - time it took for training: 0:27:02.968852


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 1 on 2409-2018: bart-abs-2409-1947-lr-3e-05-bs-8-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.1721,3.576116,0.4573,0.2036,0.3842,0.3851,0.8952,0.8917,0.8933,0.405,36.972727
2,0.1505,3.572369,0.45,0.1979,0.3854,0.3855,0.8956,0.8912,0.8933,0.3964,36.327273
3,0.1132,3.725115,0.4535,0.2052,0.385,0.3867,0.8955,0.8917,0.8934,0.4043,37.427273
4,0.0881,3.846108,0.4676,0.2097,0.397,0.3983,0.8967,0.8917,0.8941,0.4047,35.709091
5,0.0734,3.838491,0.458,0.21,0.3905,0.3919,0.8939,0.8927,0.8931,0.4105,38.018182
6,0.0612,3.898042,0.462,0.2198,0.4014,0.4029,0.8957,0.8926,0.894,0.4124,37.372727


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 1: bart-abs-2409-1947-lr-3e-05-bs-8-maxep-6 - time it took for training: 0:12:38.492568


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

=== Starting experiment 2 on 2409-2032: bart-abs-2409-1947-lr-3e-05-bs-8-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.0785,3.983774,0.4581,0.1987,0.3887,0.3892,0.8957,0.8906,0.893,0.4019,35.645455
2,0.0862,3.907476,0.4574,0.2028,0.3856,0.3863,0.8923,0.8918,0.8919,0.4091,39.154545
3,0.0792,3.979428,0.4593,0.1972,0.3807,0.3814,0.889,0.8926,0.8906,0.4145,41.918182
4,0.0673,4.041896,0.4634,0.2047,0.3928,0.3937,0.8948,0.8918,0.8931,0.4133,36.690909
5,0.0604,4.1048,0.4629,0.2112,0.396,0.3971,0.8956,0.8926,0.8939,0.4118,36.972727
6,0.0548,4.133064,0.4556,0.2042,0.3904,0.391,0.8938,0.8917,0.8926,0.4079,38.154545
7,0.0508,4.173976,0.4546,0.1949,0.383,0.3842,0.8925,0.8903,0.8913,0.4028,37.527273
8,0.0473,4.164255,0.4653,0.212,0.401,0.4026,0.8949,0.8939,0.8942,0.4212,38.481818
9,0.0438,4.191323,0.472,0.2155,0.4063,0.4071,0.8969,0.8947,0.8956,0.4223,37.909091
10,0.0401,4.208365,0.4731,0.2204,0.4091,0.4105,0.8963,0.8954,0.8957,0.4281,38.318182


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 2: bart-abs-2409-1947-lr-3e-05-bs-8-maxep-10 - time it took for training: 0:21:08.197410


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 3 on 2409-2055: bart-abs-2409-1947-lr-0.0003-bs-4-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,2.1377,3.921995,0.3283,0.1009,0.2612,0.2612,0.8785,0.8638,0.871,0.2695,33.0
2,3.3219,3.752268,0.2756,0.0805,0.2368,0.237,0.8845,0.8545,0.8692,0.2111,25.0
3,2.115,4.07831,0.282,0.0747,0.2116,0.2118,0.8663,0.8623,0.8642,0.2582,41.0
4,1.1461,4.879511,0.251,0.0501,0.21,0.2102,0.8497,0.8506,0.8501,0.2025,37.0
5,0.6272,5.80943,0.2811,0.0751,0.229,0.2293,0.8628,0.8693,0.866,0.2058,44.0
6,0.3841,6.342303,0.2439,0.0504,0.2065,0.2067,0.8544,0.8581,0.8562,0.229,46.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 3: bart-abs-2409-1947-lr-0.0003-bs-4-maxep-6 - time it took for training: 0:13:12.737365


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 4 on 2409-2110: bart-abs-2409-1947-lr-0.0003-bs-4-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,3.3364,3.895215,0.2911,0.0832,0.2351,0.2361,0.8685,0.8711,0.8697,0.2279,43.0
2,2.369,4.0594,0.2603,0.0584,0.2204,0.2202,0.871,0.8545,0.8626,0.2129,35.0
3,1.4708,4.606133,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,45.0
4,0.9251,5.223887,0.2333,0.0475,0.1761,0.1762,0.8431,0.8562,0.8495,0.2342,58.827273
5,0.6367,5.819339,0.2622,0.0744,0.2001,0.1997,0.8634,0.8616,0.8625,0.1982,32.0
6,0.486,6.297507,0.2591,0.0557,0.2009,0.2012,0.859,0.8605,0.8597,0.2511,48.009091
7,0.3892,6.500186,0.2582,0.0781,0.2156,0.2154,0.8771,0.8626,0.8697,0.1855,29.0
8,0.3152,6.735162,0.313,0.0882,0.2413,0.2416,0.8789,0.8681,0.8735,0.2252,34.0
9,0.2751,6.997021,0.2906,0.0847,0.2272,0.2274,0.8671,0.8567,0.8618,0.1991,27.0
10,0.24,7.16334,0.2439,0.0504,0.2065,0.2067,0.8544,0.8581,0.8562,0.229,45.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 4: bart-abs-2409-1947-lr-0.0003-bs-4-maxep-10 - time it took for training: 0:22:02.307270


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

=== Starting experiment 5 on 2409-2133: bart-abs-2409-1947-lr-0.0003-bs-2-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.955,5.774044,0.2485,0.0542,0.1867,0.1867,0.8491,0.8557,0.8523,0.2552,54.0
2,0.8434,5.69267,0.2599,0.0592,0.202,0.2017,0.8553,0.8626,0.8589,0.2583,46.0
3,0.5948,5.890735,0.2473,0.0528,0.1834,0.1833,0.8458,0.856,0.8508,0.2569,54.0
4,0.4377,6.573647,0.2591,0.0557,0.2009,0.2012,0.859,0.8605,0.8597,0.2511,48.0
5,0.3416,6.859653,0.3035,0.072,0.2428,0.2429,0.8724,0.8571,0.8646,0.2108,29.0
6,0.268,7.144084,0.3035,0.072,0.2428,0.2429,0.8724,0.8571,0.8646,0.2108,29.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 5: bart-abs-2409-1947-lr-0.0003-bs-2-maxep-6 - time it took for training: 0:16:14.438001


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 6 on 2409-2150: bart-abs-2409-1947-lr-0.0003-bs-2-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.6036,6.432414,0.2828,0.0721,0.2287,0.229,0.8776,0.863,0.8702,0.1865,29.0
2,0.6828,5.832995,0.2817,0.0594,0.2119,0.2118,0.8553,0.8592,0.8572,0.2216,38.0
3,0.5861,6.460395,0.2456,0.0556,0.1909,0.1914,0.8622,0.8598,0.861,0.2363,41.0
4,0.4888,6.309824,0.2591,0.0557,0.2009,0.2012,0.859,0.8605,0.8597,0.2511,47.0
5,0.4314,6.707602,0.3042,0.0843,0.2354,0.2357,0.8695,0.8605,0.8649,0.22,32.0
6,0.379,6.717302,0.2844,0.0777,0.2203,0.22,0.8641,0.8631,0.8635,0.2167,34.0
7,0.3245,6.838231,0.2613,0.0803,0.214,0.2142,0.8711,0.8469,0.8588,0.2102,25.0
8,0.289,7.025251,0.2396,0.0481,0.1978,0.198,0.8526,0.8544,0.8534,0.2079,34.0
9,0.2575,7.126397,0.3089,0.0693,0.2341,0.2343,0.8686,0.8645,0.8665,0.2205,36.0
10,0.2312,7.405517,0.2434,0.0406,0.2027,0.203,0.8533,0.8523,0.8528,0.194,34.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 6: bart-abs-2409-1947-lr-0.0003-bs-2-maxep-10 - time it took for training: 0:25:33.537305


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 7 on 2409-2218: bart-abs-2409-1947-lr-0.0003-bs-8-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.3901,6.58334,0.2377,0.0309,0.193,0.1932,0.8496,0.853,0.8512,0.2159,45.0
2,0.3274,6.558266,0.2439,0.0504,0.2065,0.2067,0.8544,0.8581,0.8562,0.229,45.0
3,0.3098,6.929381,0.2613,0.0803,0.214,0.2142,0.8711,0.8469,0.8588,0.2102,25.0
4,0.2625,7.022289,0.3008,0.0767,0.229,0.2292,0.858,0.8674,0.8626,0.2167,41.0
5,0.2379,7.227599,0.3035,0.072,0.2428,0.2429,0.8724,0.8571,0.8646,0.2108,29.0
6,0.2168,7.389841,0.3035,0.072,0.2428,0.2429,0.8724,0.8571,0.8646,0.2108,29.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 7: bart-abs-2409-1947-lr-0.0003-bs-8-maxep-6 - time it took for training: 0:12:00.231702


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

=== Starting experiment 8 on 2409-2231: bart-abs-2409-1947-lr-0.0003-bs-8-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.2977,7.245364,0.268,0.0433,0.2049,0.205,0.8657,0.8613,0.8635,0.2212,35.0
2,0.3147,7.040257,0.2684,0.0598,0.2092,0.2091,0.8595,0.8599,0.8596,0.2363,41.0
3,0.5099,7.021123,0.2684,0.0598,0.2092,0.2091,0.8595,0.8599,0.8596,0.2363,41.0
4,0.2802,7.1107,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
5,0.2652,7.198689,0.2622,0.0744,0.2001,0.1997,0.8634,0.8616,0.8625,0.1982,32.0
6,0.255,7.17194,0.2591,0.0557,0.2009,0.2012,0.859,0.8605,0.8597,0.2511,47.0
7,0.2379,7.152111,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
8,0.2375,7.363271,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
9,0.219,7.438217,0.3089,0.0693,0.2341,0.2343,0.8686,0.8645,0.8665,0.2205,36.0
10,0.2091,7.548461,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 8: bart-abs-2409-1947-lr-0.0003-bs-8-maxep-10 - time it took for training: 0:19:52.506418


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

=== Starting experiment 9 on 2409-2253: bart-abs-2409-1947-lr-3e-06-bs-4-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.2442,7.179628,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
2,0.2514,7.246984,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
3,0.2226,7.295325,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
4,0.2207,7.334236,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
5,0.2177,7.358789,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
6,0.2176,7.366581,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 9: bart-abs-2409-1947-lr-3e-06-bs-4-maxep-6 - time it took for training: 0:13:20.423511


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

=== Starting experiment 10 on 2409-2307: bart-abs-2409-1947-lr-3e-06-bs-4-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.2264,7.297967,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
2,0.243,7.356686,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
3,0.2153,7.403932,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
4,0.2144,7.452021,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
5,0.2122,7.486974,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
6,0.2117,7.509673,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
7,0.2116,7.530538,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
8,0.2108,7.544109,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
9,0.2129,7.548274,0.2982,0.0831,0.2333,0.2336,0.8593,0.8643,0.8618,0.2356,38.4
10,0.2123,7.55064,0.3083,0.0846,0.2429,0.2432,0.8595,0.8658,0.8626,0.2274,36.581818


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 10: bart-abs-2409-1947-lr-3e-06-bs-4-maxep-10 - time it took for training: 0:22:01.122501


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 11 on 2409-2331: bart-abs-2409-1947-lr-3e-06-bs-2-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.2033,7.593763,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
2,0.2002,7.659335,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
3,0.1987,7.68996,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
4,0.1973,7.723392,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
5,0.1975,7.738822,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
6,0.2146,7.737656,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 11: bart-abs-2409-1947-lr-3e-06-bs-2-maxep-6 - time it took for training: 0:15:32.206235


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

=== Starting experiment 12 on 2409-2348: bart-abs-2409-1947-lr-3e-06-bs-2-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.1989,7.690619,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
2,0.1993,7.737114,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
3,0.1978,7.761429,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
4,0.1965,7.798968,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
5,0.1968,7.820422,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
6,0.215,7.807253,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
7,0.2144,7.800263,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
8,0.2133,7.797372,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
9,0.2136,7.7947,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
10,0.2119,7.795702,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 12: bart-abs-2409-1947-lr-3e-06-bs-2-maxep-10 - time it took for training: 0:26:19.778092


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

=== Starting experiment 13 on 2509-0016: bart-abs-2409-1947-lr-3e-06-bs-8-maxep-6 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.1809,7.765838,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
2,0.1825,7.789093,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
3,0.1822,7.802975,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
4,0.1807,7.814247,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
5,0.2002,7.814513,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
6,0.2047,7.812089,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 13: bart-abs-2409-1947-lr-3e-06-bs-8-maxep-6 - time it took for training: 0:11:52.663646


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

=== Starting experiment 14 on 2509-0029: bart-abs-2409-1947-lr-3e-06-bs-8-maxep-10 training


  self.scaler = torch.cuda.amp.GradScaler(**kwargs)


Epoch,Training Loss,Validation Loss,Rouge/rouge1,Rouge/rouge2,Rouge/rougel,Rouge/rougelsum,Bertscore/bertscore-precision,Bertscore/bertscore-recall,Bertscore/bertscore-f1,Meteor,Gen Len
1,0.1784,7.816429,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
2,0.1816,7.834855,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
3,0.1813,7.847122,0.2677,0.0541,0.2002,0.2007,0.8757,0.864,0.8697,0.25,37.0
4,0.1798,7.859787,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
5,0.2,7.85682,0.2722,0.0714,0.2029,0.2031,0.8612,0.8618,0.8615,0.2582,44.0
6,0.2047,7.84579,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
7,0.2066,7.840898,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0
8,0.2144,7.838196,0.2646,0.0434,0.203,0.2031,0.867,0.8616,0.8642,0.2187,36.0
9,0.2062,7.836782,0.2646,0.0434,0.203,0.2031,0.867,0.8616,0.8642,0.2187,36.0
10,0.2056,7.836253,0.3097,0.0856,0.2463,0.2464,0.8589,0.8656,0.8622,0.2246,36.0


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}
Non-default generation parameters: {'max_length': 62, 'min_l

Finished experiment 14: bart-abs-2409-1947-lr-3e-06-bs-8-maxep-10 - time it took for training: 0:19:59.770202


Non-default generation parameters: {'max_length': 62, 'min_length': 11, 'early_stopping': True, 'num_beams': 6, 'length_penalty': 0.5, 'no_repeat_ngram_size': 3, 'forced_eos_token_id': 2}


Upload 2 LFS files:   0%|          | 0/2 [00:00<?, ?it/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

training_args.bin:   0%|          | 0.00/5.50k [00:00<?, ?B/s]

In [32]:
# Using wandb documentation: https://docs.wandb.ai/guides/artifacts
def log_csv_wandb(results_path, model_name):
    artifact = wandb.Artifact(name=model_name, type="predictions")
    for root, dirs, files in os.walk(results_path):
        for file in files:
            artifact.add_file(local_path=os.path.join(root, file), name=file)
    wandb.log_artifact(artifact)

In [33]:
log_csv_wandb(results_dir, run_name)

In [34]:
print("Finished all training and evaluation for", run_name)
wandb.finish()

Finished all training and evaluation for bart-abs-2409-1947


[34m[1mwandb[0m:                                                                                
[34m[1mwandb[0m: 
[34m[1mwandb[0m: Run history:
[34m[1mwandb[0m:        eval/bertscore/bertscore-f1 ▇██▇▇█▄▃▃▂▂▁▃▃▄▂▃▃▂▁▃▃▃▂▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃
[34m[1mwandb[0m: eval/bertscore/bertscore-precision █████████▆▄▁▃▅▅▃▄▂▂▅▄▃▄▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃▃
[34m[1mwandb[0m:    eval/bertscore/bertscore-recall ▇████████▃▂▂▃▂▂▃▂▃▃▃▂▃▁▃▄▄▃▃▃▃▄▄▄▄▄▄▄▃▄▃
[34m[1mwandb[0m:                       eval/gen_len ▄▄▄▄▅▄▄▄▄▄▃▅▄▆▃██▇▂▂▆▃▁▆▅▄▆▆▆▆▆▆▄▄▄▄▄▄▆▄
[34m[1mwandb[0m:                          eval/loss ▁▁▃▃▃▃▃▃▄▅▆▅▆▇▆▆▇▇▆▆▇▇▇█▇▇▇▇▇███████████
[34m[1mwandb[0m:                        eval/meteor █▇▇▇▇▂▂▂▁▁▂▁▃▂▂▂▂▂▂▃▃▃▃▃▃▃▂▂▂▂▃▂▂▂▃▃▃▂▂▂
[34m[1mwandb[0m:                  eval/rouge/rouge1 ▇█▇▇▇█▁▂▁▂▁▂▂▃▂▁▃▂▂▂▂▂▂▂▃▃▃▃▃▃▃▃▃▃▂▂▂▃▂▂
[34m[1mwandb[0m:                  eval/rouge/rouge2 █▇█▇▇▇▇▇▇▂▁▂▁▂▁▂▁▁▁▂▂▂▁▃▁▂▂▂▂▂▃▃▃▂▃▃▂▃▃▃
[34m[1mwandb[0m:                  eval/rouge/rougeL ▇▇▇▇██▂▂▃▂▁▂▂▁▁▂▂▁▁▃▂▂▃

In [35]:
print("Results uploaded")

Results uploaded
