In [1]:
from transformers import AutoModelWithLMHead,BertForSequenceClassification, AutoTokenizer, AutoModel,AutoModelForMaskedLM,AutoModelForSequenceClassification
import torch
from torch import nn
import json
import numpy as np
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import train_test_split,StratifiedShuffleSplit
from torch.utils.data import DataLoader,TensorDataset
from transformers import Trainer, TrainingArguments
import pickle
from sklearn.metrics import confusion_matrix,classification_report
from sklearn.metrics import accuracy_score, recall_score, precision_score, f1_score,roc_curve
import pandas as pd
import matplotlib.pyplot as plt


In [2]:
model = AutoModelForMaskedLM.from_pretrained("emilyalsentzer/Bio_ClinicalBERT")

Some weights of the model checkpoint at emilyalsentzer/Bio_ClinicalBERT were not used when initializing BertForMaskedLM: ['cls.seq_relationship.weight', 'cls.seq_relationship.bias']
- This IS expected if you are initializing BertForMaskedLM from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForMaskedLM from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).


In [3]:
model

BertForMaskedLM(
  (bert): BertModel(
    (embeddings): BertEmbeddings(
      (word_embeddings): Embedding(28996, 768, padding_idx=0)
      (position_embeddings): Embedding(512, 768)
      (token_type_embeddings): Embedding(2, 768)
      (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
      (dropout): Dropout(p=0.1, inplace=False)
    )
    (encoder): BertEncoder(
      (layer): ModuleList(
        (0): BertLayer(
          (attention): BertAttention(
            (self): BertSelfAttention(
              (query): Linear(in_features=768, out_features=768, bias=True)
              (key): Linear(in_features=768, out_features=768, bias=True)
              (value): Linear(in_features=768, out_features=768, bias=True)
              (dropout): Dropout(p=0.1, inplace=False)
            )
            (output): BertSelfOutput(
              (dense): Linear(in_features=768, out_features=768, bias=True)
              (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=Tr

In [4]:
model.bert.embeddings.word_embeddings

Embedding(28996, 768, padding_idx=0)

In [5]:
for name, param in model.bert.embeddings.word_embeddings.named_parameters():
    #print(dir(param))
    if param.requires_grad:
        print(name, len(param.data),param.data)

weight 28996 tensor([[-0.0333, -0.0794, -0.0196,  ..., -0.0365, -0.0359,  0.0013],
        [ 0.0125, -0.0182, -0.0349,  ..., -0.0387, -0.0596, -0.0106],
        [-0.0384, -0.0131,  0.0037,  ..., -0.0394, -0.0423, -0.0357],
        ...,
        [-0.0045, -0.0044, -0.0520,  ..., -0.0384, -0.0762, -0.0117],
        [-0.0235,  0.0125, -0.0237,  ..., -0.0818,  0.0034, -0.0393],
        [ 0.0488, -0.0234, -0.0319,  ..., -0.0522, -0.0444, -0.0116]])


In [7]:
for name, param in model.bert.embeddings.word_embeddings.named_parameters():
    #print(dir(param))
    if param.requires_grad:
        print(name, len(param.data),param.data)

weight 29002 tensor([[-0.0333, -0.0794, -0.0196,  ..., -0.0365, -0.0359,  0.0013],
        [ 0.0125, -0.0182, -0.0349,  ..., -0.0387, -0.0596, -0.0106],
        [-0.0384, -0.0131,  0.0037,  ..., -0.0394, -0.0423, -0.0357],
        ...,
        [-0.0015,  0.0085, -0.0136,  ..., -0.0067,  0.0218, -0.0072],
        [-0.0160,  0.0052,  0.0189,  ..., -0.0064, -0.0283,  0.0127],
        [-0.0282,  0.0033,  0.0212,  ..., -0.0097, -0.0260, -0.0052]])


In [5]:
for name, param in model.bert.embeddings.word_embeddings.named_parameters():
    #print(dir(param))
    if param.requires_grad:
        print(name, len(param.data),param.data)

weight 29002 tensor([[-0.0333, -0.0794, -0.0196,  ..., -0.0365, -0.0359,  0.0013],
        [ 0.0125, -0.0182, -0.0349,  ..., -0.0387, -0.0596, -0.0106],
        [-0.0384, -0.0131,  0.0037,  ..., -0.0394, -0.0423, -0.0357],
        ...,
        [-0.0147, -0.0325, -0.0084,  ..., -0.0460,  0.0382,  0.0045],
        [ 0.0046,  0.0099, -0.0027,  ...,  0.0149,  0.0103, -0.0042],
        [ 0.0223,  0.0003,  0.0170,  ...,  0.0172, -0.0408, -0.0061]])


In [6]:
for name, param in model.bert.embeddings.word_embeddings.named_parameters():
    #print(dir(param))
    if param.requires_grad:
        print(name, len(param.data),param.data)

weight 29002 tensor([[-0.0333, -0.0794, -0.0196,  ..., -0.0365, -0.0359,  0.0013],
        [ 0.0125, -0.0182, -0.0349,  ..., -0.0387, -0.0596, -0.0106],
        [-0.0384, -0.0131,  0.0037,  ..., -0.0394, -0.0423, -0.0357],
        ...,
        [-0.0376,  0.0200, -0.0143,  ...,  0.0254,  0.0201, -0.0004],
        [-0.0055, -0.0355,  0.0392,  ..., -0.0206,  0.0027, -0.0159],
        [-0.0111,  0.0308,  0.0389,  ...,  0.0054, -0.0082, -0.0020]])


In [5]:
model.resize_token_embeddings(29002)

Embedding(29002, 768)

In [6]:
model.config.tie_word_embeddings = False

In [5]:
model.config.tie_word_embeddings

True

In [12]:
model.bert.embeddings.word_embeddings.parameters()[-6:] #weight[-6:]

TypeError: 'generator' object is not subscriptable

In [13]:
model.named_parameters()

<generator object Module.named_parameters at 0x0000028B98AEF7B0>

In [2]:
tokenizer = AutoTokenizer.from_pretrained("emilyalsentzer/Bio_ClinicalBERT")
new_tokens = ["interstitial", "fibrosis", "tubular", "atrophy","antibody","T-cell"]
tokenizer.add_tokens(new_tokens)

6

In [2]:
tokenizer = AutoTokenizer.from_pretrained("dmis-lab/biobert-base-cased-v1.1")

In [2]:
tokenizer = AutoTokenizer.from_pretrained("emilyalsentzer/Bio_ClinicalBERT")

In [2]:
tokenizer = AutoTokenizer.from_pretrained("bert-base-cased")

In [3]:
data = pd.read_csv("data.csv")
# inputs1 = data["train_report"].tolist()
inputs1 = data["train_report_qa"].tolist()
label1 = data["IFTA"].tolist()

In [4]:
label2 = [l for i,l in zip(inputs1,label1) if str(i)!="nan"]
#label = [0 if l in ["nosig","minimal","noinfo"] else (1 if l=="mild" else (2 if l=="moderate" else 3)) for l in label2]
label = []
for l in label2:
    if l == "noinfo":
        label.append(0)
    elif l == "nosig":
        label.append(1)
    elif l == "minimal":
        label.append(2)
    elif l == "mild":
        label.append(3)
    elif l == "moderate":
        label.append(4)
    else:
        label.append(5)
inputs = [i for i in inputs1 if str(i)!="nan"]

In [5]:
train_text, test_text, train_labels, test_labels = train_test_split(
    inputs, label,random_state = 1,stratify=label,test_size=0.2)

In [6]:
class RenalDataset(torch.utils.data.Dataset):
    def __init__(self, encodings, labels):
        self.encodings = encodings
        self.labels = labels

    def __getitem__(self, idx):
        item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
        item['labels'] = torch.tensor(self.labels[idx])
        return item

    def __len__(self):
        return len(self.labels)
def compute_metrics(p):    
    pred, labels = p
    pred = np.argmax(pred, axis=1)
    accuracy = accuracy_score(y_true=labels, y_pred=pred)
    recall = recall_score(y_true=labels, y_pred=pred,average="micro")
    precision = precision_score(y_true=labels, y_pred=pred,average="micro")
    f1 = f1_score(y_true=labels, y_pred=pred,average="weighted")
    return {"accuracy": accuracy, "precision": precision, "recall": recall, "f1": f1} 

In [7]:
train_encodings = tokenizer(train_text,padding="max_length", truncation=True, 
                            return_tensors="pt",max_length=512)
test_encodings = tokenizer(test_text,padding="max_length", truncation=True, 
                            return_tensors="pt",max_length=512)
train_dataset = RenalDataset(train_encodings, train_labels)
test_dataset = RenalDataset(test_encodings, test_labels)
# model_renal = AutoModelForSequenceClassification.from_pretrained("./mlm_results_largeData/checkpoint-1100",num_labels=6)
# model_renal = AutoModelForSequenceClassification.from_pretrained("bert-base-cased",num_labels=6)
model_renal = AutoModelForSequenceClassification.from_pretrained("./mlm_results_largeData_extended_tokenizer_lr/checkpoint-1400",num_labels=6)
#model_renal = AutoModelForSequenceClassification.from_pretrained("dmis-lab/biobert-base-cased-v1.1",num_labels=6)


Some weights of the model checkpoint at ./mlm_results_largeData_extended_tokenizer_lr/checkpoint-1400 were not used when initializing BertForSequenceClassification: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.decoder.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.bias', 'cls.predictions.transform.dense.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the mod

In [None]:
# BERT - ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_mlm_results_ifta_4labels_largeData_batch16_extoken',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 15
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 2580
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.5577,1.388861,0.512409,0.512409,0.512409,0.42448
100,1.2313,1.162278,0.59708,0.59708,0.59708,0.492329
150,1.212,1.105211,0.613139,0.613139,0.613139,0.502948
200,1.1327,1.053624,0.618978,0.618978,0.618978,0.550526
250,1.0724,0.930673,0.651095,0.651095,0.651095,0.576806
300,0.9607,0.959221,0.665693,0.665693,0.665693,0.594036
350,0.94,0.925783,0.664234,0.664234,0.664234,0.590649
400,0.936,0.964335,0.652555,0.652555,0.652555,0.6314
450,0.8791,0.998828,0.637956,0.637956,0.637956,0.564034
500,0.9565,0.960702,0.626277,0.626277,0.626277,0.543292


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\pytorch_model.bin
Deleting olde

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\pytorch_model.bin
Deleting o

In [None]:
# KidneyBERT - ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_mlm_results_ifta_4labels_largeData_batch16_extoken',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 15
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 2580
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.4626,1.183166,0.581022,0.581022,0.581022,0.477052
100,1.1018,0.980255,0.633577,0.633577,0.633577,0.562757
150,1.0853,0.928196,0.658394,0.658394,0.658394,0.576777
200,0.9658,0.90272,0.664234,0.664234,0.664234,0.628368
250,0.958,0.866512,0.678832,0.678832,0.678832,0.64881
300,0.9156,0.905765,0.667153,0.667153,0.667153,0.626471
350,0.8373,0.855402,0.69927,0.69927,0.69927,0.658419
400,0.8033,0.824018,0.718248,0.718248,0.718248,0.696512
450,0.7807,0.822974,0.708029,0.708029,0.708029,0.673226
500,0.806,0.805589,0.689051,0.689051,0.689051,0.651244


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\pytorch_model.bin
Deleting olde

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\pytorch_model.bin
Deleting o

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


In [8]:
# KidneyBERT - qa ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_mlm_results_ifta_4labels_largeData_batch16_extoken',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 15
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 2580
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.4562,1.151662,0.59854,0.59854,0.59854,0.491674
100,0.7951,0.438924,0.849635,0.849635,0.849635,0.823548
150,0.4594,0.408765,0.891971,0.891971,0.891971,0.878131
200,0.3407,0.387071,0.894891,0.894891,0.894891,0.873957
250,0.3319,0.365728,0.905109,0.905109,0.905109,0.903574
300,0.3442,0.397677,0.886131,0.886131,0.886131,0.868524
350,0.2894,0.352807,0.89781,0.89781,0.89781,0.890348
400,0.2974,0.419329,0.874453,0.874453,0.874453,0.876963
450,0.2409,0.387285,0.89927,0.89927,0.89927,0.891748
500,0.2653,0.388091,0.89781,0.89781,0.89781,0.897468


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-650] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\pytorch_model.bin
Deleting olde

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\pytorch_model.bin
Deleting o

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-350 (score: 0.3528066575527191).


In [8]:
# exKidneyBERT - ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_mlm_results_ifta_4labels_largeData_batch16_extoken',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 15
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 2580
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.4629,1.143271,0.59854,0.59854,0.59854,0.493175
100,1.08,1.083766,0.616058,0.616058,0.616058,0.541205
150,1.0752,0.950542,0.659854,0.659854,0.659854,0.595676
200,0.9521,0.937897,0.630657,0.630657,0.630657,0.579477
250,0.9544,0.900083,0.667153,0.667153,0.667153,0.63769
300,0.9153,0.862881,0.693431,0.693431,0.693431,0.669477
350,0.8185,0.843714,0.691971,0.691971,0.691971,0.635012
400,0.7924,0.83221,0.684672,0.684672,0.684672,0.675337
450,0.7656,0.835042,0.70073,0.70073,0.70073,0.666819
500,0.805,0.816369,0.671533,0.671533,0.671533,0.632238


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-300] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\pytorch_model.bin
Deleting olde

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\pytorch_model.bin
Deleting o

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-700 (score: 0.8057909607887268).


In [8]:
# exKidneyBERT_lr - qa ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_mlm_results_ifta_4labels_largeData_batch16_extoken',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 15
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 2580
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.4516,1.075703,0.626277,0.626277,0.626277,0.512141
100,0.6478,0.414251,0.891971,0.891971,0.891971,0.880026
150,0.4603,0.437068,0.872993,0.872993,0.872993,0.851261
200,0.4004,0.424771,0.887591,0.887591,0.887591,0.861179
250,0.33,0.40223,0.890511,0.890511,0.890511,0.876411
300,0.3465,0.361697,0.90073,0.90073,0.90073,0.886696
350,0.3309,0.407881,0.90073,0.90073,0.90073,0.891341
400,0.2811,0.424414,0.881752,0.881752,0.881752,0.886123
450,0.2599,0.417459,0.893431,0.893431,0.893431,0.881994
500,0.2361,0.390827,0.90219,0.90219,0.90219,0.902108


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-800] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-100\pytorch_model.bin
Deleting olde

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-600\pytorch_model.bin
Deleting o

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-1600\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2050\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2100\pytorch_model.bin
Del

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550
Configuration saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550\config.json
Model weights saved in ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2550\pytorch_model.bin
Deleting older checkpoint [fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-2500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from ./fine_mlm_results_ifta_4labels_largeData_batch16_extoken\checkpoint-300 (score: 0.3616968095302582).


In [8]:
# BioBERT - ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_bioBERT_results_ifta_4labels_largeData_batch16',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

trainer.train()


***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 3440
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.4897,1.287165,0.518248,0.518248,0.518248,0.422044
100,1.1587,1.048901,0.610219,0.610219,0.610219,0.500856
150,1.0781,0.960798,0.671533,0.671533,0.671533,0.591547
200,0.9789,0.916042,0.662774,0.662774,0.662774,0.623582
250,0.9651,0.888289,0.69927,0.69927,0.69927,0.649876
300,0.8934,0.889392,0.691971,0.691971,0.691971,0.64347
350,0.8235,0.842183,0.69635,0.69635,0.69635,0.651656
400,0.8343,0.846844,0.70219,0.70219,0.70219,0.679359
450,0.8021,0.880122,0.675912,0.675912,0.675912,0.62939
500,0.8326,0.841846,0.664234,0.664234,0.664234,0.636635


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-50
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-300] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-100
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_r

Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-600
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
**

Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./f

Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1650
Configuration saved in ./fine_bioBERT_result

  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_large

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2600
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2600\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2600\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64


KeyboardInterrupt: 

In [None]:
# BioBERT - qa ifta cls 
batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_bioBERT_results_ifta_4labels_largeData_batch16',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

trainer.train()


***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 3440
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.5015,1.382176,0.467153,0.467153,0.467153,0.357851
100,1.051,0.842015,0.715328,0.715328,0.715328,0.636124
150,0.8533,0.736691,0.748905,0.748905,0.748905,0.665873
200,0.7251,0.67944,0.772263,0.772263,0.772263,0.72963
250,0.5521,0.484167,0.871533,0.871533,0.871533,0.854789
300,0.4669,0.446796,0.859854,0.859854,0.859854,0.846423
350,0.437,0.521461,0.859854,0.859854,0.859854,0.843272
400,0.3899,0.546551,0.826277,0.826277,0.826277,0.837394
450,0.3906,0.467222,0.865693,0.865693,0.865693,0.8461
500,0.3741,0.392983,0.891971,0.891971,0.891971,0.877525


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-50
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-750] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-100
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_r

Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-600
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
**

Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./f

Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-1650
Configuration saved in ./fine_bioBERT_result

  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_large

***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2600
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2600\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2600\pytorch_model.bin
Deleting older checkpoint [fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2650
Configuration saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2650\config.json
Model weights saved in ./fine_bioBERT_results_ifta_4labels_largeData_batch16\checkpoint-2650\pytorch_model.bin
Deleting older checkpoint [fine

In [None]:
# ClinicalBERT - ifta cls
batch_size = 16
model_cli = AutoModelForSequenceClassification.from_pretrained("emilyalsentzer/Bio_ClinicalBERT",num_labels=6)
training_args = TrainingArguments(
    output_dir='./fine_cliBERT_results_ifta_4labels_largeData_batch16',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_cli,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

trainer.train()


Some weights of the model checkpoint at emilyalsentzer/Bio_ClinicalBERT were not used when initializing BertForSequenceClassification: ['cls.predictions.decoder.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.bias', 'cls.seq_relationship.weight', 'cls.predictions.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.554,1.242224,0.576642,0.576642,0.576642,0.471908
100,1.1243,1.165618,0.613139,0.613139,0.613139,0.501815
150,1.1529,0.963942,0.643796,0.643796,0.643796,0.553779
200,1.032,0.929965,0.662774,0.662774,0.662774,0.593074
250,0.9942,0.885117,0.665693,0.665693,0.665693,0.596577
300,0.9147,0.883437,0.665693,0.665693,0.665693,0.59182
350,0.8645,0.85824,0.683212,0.683212,0.683212,0.624408
400,0.8327,0.826329,0.694891,0.694891,0.694891,0.685623
450,0.7928,0.875262,0.687591,0.687591,0.687591,0.650343
500,0.8704,0.80242,0.69927,0.69927,0.69927,0.669661


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-50
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-800] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-100
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_r

Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-600
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
**

Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fi

Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1650
Configuration saved in ./fine_cliBERT_result

  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_large

In [None]:
# ClinicalBERT - qa ifta cls
batch_size = 16
model_cli = AutoModelForSequenceClassification.from_pretrained("emilyalsentzer/Bio_ClinicalBERT",num_labels=6)
training_args = TrainingArguments(
    output_dir='./fine_cliBERT_results_ifta_4labels_largeData_batch16',          
    num_train_epochs=15,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*4,   
    warmup_steps=50,                
    weight_decay=0.01,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_cli,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

trainer.train()


Some weights of the model checkpoint at emilyalsentzer/Bio_ClinicalBERT were not used when initializing BertForSequenceClassification: ['cls.predictions.transform.dense.bias', 'cls.predictions.transform.dense.weight', 'cls.seq_relationship.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model

Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,1.4923,1.285793,0.534307,0.534307,0.534307,0.429406
100,1.0992,0.953476,0.668613,0.668613,0.668613,0.594669
150,0.9615,0.826294,0.738686,0.738686,0.738686,0.657862
200,0.683,0.496641,0.846715,0.846715,0.846715,0.805063
250,0.4412,0.42677,0.883212,0.883212,0.883212,0.865124
300,0.4139,0.423094,0.881752,0.881752,0.881752,0.861376
350,0.3732,0.447873,0.883212,0.883212,0.883212,0.878666
400,0.3847,0.447438,0.865693,0.865693,0.865693,0.867447
450,0.3096,0.41407,0.886131,0.886131,0.886131,0.873508
500,0.3529,0.355984,0.89927,0.89927,0.89927,0.89816


***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-50
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-100
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-100\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_

Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-550\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-600
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-600\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
**

Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1000] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1100\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./f

Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1500] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1600\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1550] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-1650
Configuration saved in ./fine_cliBERT_result

  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2100\pytorch_model.bin
Deleting older checkpoint [fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2050] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 64
Saving model checkpoint to ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150
Configuration saved in ./fine_cliBERT_results_ifta_4labels_largeData_batch16\checkpoint-2150\config.json
Model weights saved in ./fine_cliBERT_results_ifta_4labels_large

In [1]:
from transformers import AutoModelWithLMHead,BertForSequenceClassification, AutoTokenizer, AutoModel,AutoModelForMaskedLM,AutoModelForSequenceClassification
import torch
from torch import nn
import json
import numpy as np
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import train_test_split,StratifiedShuffleSplit
from torch.utils.data import DataLoader,TensorDataset
from transformers import Trainer, TrainingArguments
import pickle
from sklearn.metrics import confusion_matrix,classification_report
from sklearn.metrics import accuracy_score, recall_score, precision_score, f1_score,roc_curve
import pandas as pd
import matplotlib.pyplot as plt


In [2]:
tokenizer = AutoTokenizer.from_pretrained("emilyalsentzer/Bio_ClinicalBERT")
new_tokens = ["interstitial", "fibrosis", "tubular", "atrophy","antibody","T-cell"]
tokenizer.add_tokens(new_tokens)

6

In [2]:
tokenizer = AutoTokenizer.from_pretrained("dmis-lab/biobert-base-cased-v1.1")

In [2]:
tokenizer = AutoTokenizer.from_pretrained("emilyalsentzer/Bio_ClinicalBERT")

In [3]:
data = pd.read_csv("data.csv")
inputs1 = data["train_report_qa"].tolist()
label1 = data["isRejection"].tolist()

label = [l for i,l in zip(inputs1,label1) if str(i)!="nan"]
inputs = [i for i in inputs1 if str(i)!="nan"]

In [4]:
train_text, test_text, train_labels, test_labels = train_test_split(
    inputs, label,random_state = 1,stratify=label,test_size=0.2)

In [5]:
class RenalDataset(torch.utils.data.Dataset):
    def __init__(self, encodings, labels):
        self.encodings = encodings
        self.labels = labels

    def __getitem__(self, idx):
        item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
        item['labels'] = torch.tensor(self.labels[idx])
        return item

    def __len__(self):
        return len(self.labels)
def compute_metrics(p):    
    pred, labels = p
    pred = np.argmax(pred, axis=1)
    accuracy = accuracy_score(y_true=labels, y_pred=pred)
    recall = recall_score(y_true=labels, y_pred=pred)
    precision = precision_score(y_true=labels, y_pred=pred)
    f1 = f1_score(y_true=labels, y_pred=pred)
    return {"accuracy": accuracy, "precision": precision, "recall": recall, "f1": f1} 

In [6]:
train_encodings = tokenizer(train_text,padding="max_length", truncation=True, 
                            return_tensors="pt",max_length=512)
test_encodings = tokenizer(test_text,padding="max_length", truncation=True, 
                            return_tensors="pt",max_length=512)
train_dataset = RenalDataset(train_encodings, train_labels)
test_dataset = RenalDataset(test_encodings, test_labels)
# model_renal = AutoModelForSequenceClassification.from_pretrained("./mlm_results_largeData/checkpoint-1100")
# model_renal = AutoModelForSequenceClassification.from_pretrained("bert-base-cased")
# model_renal = AutoModelForSequenceClassification.from_pretrained("dmis-lab/biobert-base-cased-v1.1")
# model_renal = AutoModelForSequenceClassification.from_pretrained("./mlm_results_largeData_extended_tokenizer/checkpoint-1100")
model_renal = AutoModelForSequenceClassification.from_pretrained("emilyalsentzer/Bio_ClinicalBERT")

Some weights of the model checkpoint at emilyalsentzer/Bio_ClinicalBERT were not used when initializing BertForSequenceClassification: ['cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.seq_relationship.weight', 'cls.predictions.transform.dense.weight', 'cls.predictions.decoder.weight', 'cls.seq_relationship.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model

In [None]:
# BioBERT - qa cls

batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_exkidBERTcased_results_largeData_batch16_wd1e-5',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*2,   
    warmup_steps=50,                
    weight_decay=1e-5,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 3440
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,0.3487,0.224976,0.944526,0.0,0.0,0.0
100,0.2226,0.243678,0.944526,0.0,0.0,0.0
150,0.2268,0.210406,0.944526,0.0,0.0,0.0
200,0.1893,0.139218,0.944526,0.0,0.0,0.0
250,0.1642,0.123087,0.964964,0.733333,0.578947,0.647059
300,0.1657,0.245881,0.944526,0.0,0.0,0.0
350,0.1521,0.174738,0.960584,1.0,0.289474,0.44898
400,0.1876,0.144836,0.959124,1.0,0.263158,0.416667
450,0.1271,0.129198,0.967883,1.0,0.421053,0.592593
500,0.1614,0.16283,0.956204,1.0,0.210526,0.347826


***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1150] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100\config.json
Model weights saved in ./fine_exki

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./f

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1050
Configuration saved in ./fine_exkidBERTc

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1550
Configuration saved in ./fine_exkidBER

In [None]:
# Clinical BERT - qa cls

batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_exkidBERTcased_results_largeData_batch16_wd1e-5',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*2,   
    warmup_steps=50,                
    weight_decay=1e-5,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 3440
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,0.3178,0.22968,0.944526,0.0,0.0,0.0
100,0.2148,0.263019,0.944526,0.0,0.0,0.0
150,0.2324,0.214161,0.944526,0.0,0.0,0.0
200,0.1944,0.185097,0.944526,0.0,0.0,0.0
250,0.1915,0.150284,0.944526,0.0,0.0,0.0
300,0.192,0.217008,0.944526,0.0,0.0,0.0
350,0.1597,0.150063,0.957664,0.8,0.315789,0.45283
400,0.166,0.132223,0.947445,0.535714,0.394737,0.454545
450,0.1348,0.14554,0.954745,0.652174,0.394737,0.491803
500,0.1784,0.152015,0.957664,1.0,0.236842,0.382979


***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-650] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100\config.json
Model weights saved in ./fine_exkid

***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\pytorch_model.bin
Deleting older checkpoint [fine

  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\

  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1

In [None]:
# Kidney BERT - qa cls

batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_exkidBERTcased_results_largeData_batch16_wd1e-5',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*2,   
    warmup_steps=50,                
    weight_decay=1e-5,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 3440
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,0.3185,0.219373,0.944526,0.0,0.0,0.0
100,0.2243,0.265068,0.944526,0.0,0.0,0.0
150,0.2472,0.220932,0.944526,0.0,0.0,0.0
200,0.1973,0.203422,0.944526,0.0,0.0,0.0
250,0.2011,0.16612,0.944526,0.0,0.0,0.0
300,0.1879,0.301379,0.944526,0.0,0.0,0.0
350,0.1674,0.190871,0.953285,0.8,0.210526,0.333333
400,0.1699,0.134971,0.959124,0.857143,0.315789,0.461538
450,0.1411,0.224407,0.944526,0.0,0.0,0.0
500,0.175,0.168174,0.944526,0.0,0.0,0.0


***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2200] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100\config.json
Model weights saved in ./fine_exki

***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\config.json
Model weights saved in ./fine_ex

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-850] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./f

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500
Configuration saved in ./fine_exkidBER

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1850] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1950
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1950\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2000
Configuration saved in ./fine_exkidBER

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2450
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2450\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2500
Configuration saved in ./fine_exkidBER

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2850] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2950
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2950\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3000
Configuration saved in ./fine_exkidBER

Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


In [7]:
# exKidney BERT - qa cls

batch_size = 16
training_args = TrainingArguments(
    output_dir='./fine_exkidBERTcased_results_largeData_batch16_wd1e-5',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*2,   
    warmup_steps=50,                
    weight_decay=1e-5,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 16
  Total train batch size (w. parallel, distributed & accumulation) = 16
  Gradient Accumulation steps = 1
  Total optimization steps = 3440
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
50,0.2973,0.224674,0.944526,0.0,0.0,0.0
100,0.2183,0.27813,0.944526,0.0,0.0,0.0
150,0.2218,0.184699,0.944526,0.0,0.0,0.0
200,0.2019,0.163006,0.944526,0.0,0.0,0.0
250,0.1472,0.127365,0.964964,0.705882,0.631579,0.666667
300,0.1684,0.247684,0.944526,0.0,0.0,0.0
350,0.1208,0.193167,0.953285,1.0,0.157895,0.272727
400,0.1576,0.116394,0.963504,0.782609,0.473684,0.590164
450,0.1153,0.167927,0.962044,0.928571,0.342105,0.5
500,0.1674,0.127723,0.962044,1.0,0.315789,0.48


***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-50\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1300] due to args.save_total_limit
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5100] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100
Configuration

Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-350] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-500\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.item

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1000\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-950] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to 

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1500\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint 

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2000
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2000\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2000\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1950] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint 

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2450\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2500
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2500\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2500\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2450] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint 

Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2950\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2900] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3000
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3000\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3000\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2950] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 32
Saving model checkpoint 

In [7]:
# exKidney BERT - qa cls

batch_size = 8
training_args = TrainingArguments(
    output_dir='./fine_exkidBERTcased_results_largeData_batch16_wd1e-5',          
    num_train_epochs=20,              
    per_device_train_batch_size=batch_size,  
    per_device_eval_batch_size=batch_size*2,   
    warmup_steps=50,                
    weight_decay=1e-5,                          
    logging_steps=50*16/batch_size,
    evaluation_strategy="steps",
    eval_steps=50*16/batch_size,
    load_best_model_at_end=True,
    save_steps = 50*16/batch_size,
    save_total_limit = 1,
    seed = 0
)


trainer = Trainer(
    model=model_renal,                         
    args=training_args,                 
    train_dataset=train_dataset,         
    eval_dataset=test_dataset,
    compute_metrics=compute_metrics,
)

try:
    
    trainer.train()
except Exception as e:
    print(e)

***** Running training *****
  Num examples = 2738
  Num Epochs = 20
  Instantaneous batch size per device = 8
  Total train batch size (w. parallel, distributed & accumulation) = 8
  Gradient Accumulation steps = 1
  Total optimization steps = 6860
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Step,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
100,0.2708,0.276292,0.944526,0.0,0.0,0.0
200,0.2396,0.293186,0.944526,0.0,0.0,0.0
300,0.2305,0.232601,0.944526,0.0,0.0,0.0
400,0.227,0.205782,0.944526,0.0,0.0,0.0
500,0.2352,0.243196,0.944526,0.0,0.0,0.0
600,0.2324,0.255087,0.944526,0.0,0.0,0.0
700,0.1987,0.281646,0.944526,0.0,0.0,0.0
800,0.228,0.168213,0.944526,0.0,0.0,0.0
900,0.1748,0.177754,0.953285,1.0,0.157895,0.272727
1000,0.233,0.164829,0.944526,0.0,0.0,0.0


***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-100\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
  _warn_prf(average, modifier, msg_start, len(result))
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-200
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-200\config.json
Model weights saved in ./fine_ex

Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-400] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-900\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.item

***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1800
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1900
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1900\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-1900\pytorch_model.bin
Deleting older checkpoin

***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2800
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2900
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2900\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2900\pytorch_model.bin
Deleting older checkpoin

***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3800
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3900
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3900\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-3900\pytorch_model.bin
Deleting older checkpoin

***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4800
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4900
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4900\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-4900\pytorch_model.bin
Deleting older checkpoin

***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5800
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5900
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5900\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-5900\pytorch_model.bin
Deleting older checkpoin

***** Running Evaluation *****
  Num examples = 685
  Batch size = 16
Saving model checkpoint to ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-6800
Configuration saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-6800\config.json
Model weights saved in ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-6800\pytorch_model.bin
Deleting older checkpoint [fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-6700] due to args.save_total_limit
  item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Training completed. Do not forget to share your model on huggingface.co/models =)


Loading best model from ./fine_exkidBERTcased_results_largeData_batch16_wd1e-5\checkpoint-2200 (score: 0.12533804774284363).
