In [1]:
import pandas as pd
import numpy as np
import csv
import os
import logging
import random
import copy
import json
import argparse
import torch
import torch.nn as nn
from transformers import BertTokenizer,AdamW, BertConfig, get_linear_schedule_with_warmup
from torch.utils.data import TensorDataset, DataLoader, RandomSampler, SequentialSampler
from transformers import BertModel, BertPreTrainedModel
from tqdm import tqdm, trange
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score, f1_score, roc_auc_score, classification_report

In [2]:
label_path = '../data/label.txt'

Utils

In [3]:
logger = logging.getLogger(__name__)

ADDITIONAL_SPECIAL_TOKENS = ["<e1>", "</e1>", "<e2>", "</e2>"]


def get_label(args):
    return [label.strip() for label in open(label_path, "r", encoding="utf-8")]


def load_tokenizer(args):
    tokenizer = BertTokenizer.from_pretrained(args.model_name_or_path)
    tokenizer.add_special_tokens({"additional_special_tokens": ADDITIONAL_SPECIAL_TOKENS})
    return tokenizer


def write_prediction(args, output_file, preds):
    """
    For official evaluation script
    :param output_file: prediction_file_path (e.g. eval/proposed_answers.txt)
    :param preds: [0,1,0,2,18,...]
    """
    relation_labels = get_label(args)
    with open(output_file, "w", encoding="utf-8") as f:
        for idx, pred in enumerate(preds):
            f.write("{}\t{}\n".format(8001 + idx, relation_labels[pred]))


def init_logger():
    logging.basicConfig(
        format="%(asctime)s - %(levelname)s - %(name)s -   %(message)s",
        datefmt="%m/%d/%Y %H:%M:%S",
        level=logging.INFO)


def set_seed(args):
    random.seed(args.seed)
    np.random.seed(args.seed)
    torch.manual_seed(args.seed)
    if not args.no_cuda and torch.cuda.is_available():
        torch.cuda.manual_seed_all(args.seed)



def compute_metrics(preds, labels):
    assert len(preds) == len(labels)
    return acc(preds, labels)


def simple_accuracy(preds, labels):
    return (preds == labels).mean()


def acc(preds, labels, average="macro"):
    acc = simple_accuracy(preds, labels)
    return {
        "acc": acc}

Data_loader

In [4]:
#from utils import get_label
logger = logging.getLogger(__name__)

class InputExample(object):
    """
    A single training/test example for simple sequence classification.
    Args:
        guid: Unique id for the example.
        text_a: string. The untokenized text of the first sequence. For single
        sequence tasks, only this sequence must be specified.
        label: (Optional) string. The label of the example. This should be
        specified for train and dev examples, but not for test examples.
    """

    def __init__(self, guid, text_a, label):
        self.guid = guid
        self.text_a = text_a
        self.label = label

    def __repr__(self):
        return str(self.to_json_string())

    def to_dict(self):
        """Serializes this instance to a Python dictionary."""
        output = copy.deepcopy(self.__dict__)
        return output

    def to_json_string(self):
        """Serializes this instance to a JSON string."""
        return json.dumps(self.to_dict(), indent=2, sort_keys=True) + "\n"


class InputFeatures(object):
    """
    A single set of features of data.
    Args:
        input_ids: Indices of input sequence tokens in the vocabulary.
        attention_mask: Mask to avoid performing attention on padding token indices.
            Mask values selected in ``[0, 1]``:
            Usually  ``1`` for tokens that are NOT MASKED, ``0`` for MASKED (padded) tokens.
        token_type_ids: Segment token indices to indicate first and second portions of the inputs.
    """

    def __init__(self, input_ids, attention_mask, token_type_ids, label_id, e1_mask, e2_mask):
        self.input_ids = input_ids
        self.attention_mask = attention_mask
        self.token_type_ids = token_type_ids
        self.label_id = label_id
        self.e1_mask = e1_mask
        self.e2_mask = e2_mask

    def __repr__(self):
        return str(self.to_json_string())

    def to_dict(self):
        """Serializes this instance to a Python dictionary."""
        output = copy.deepcopy(self.__dict__)
        return output

    def to_json_string(self):
        """Serializes this instance to a JSON string."""
        return json.dumps(self.to_dict(), indent=2, sort_keys=True) + "\n"


class SemEvalProcessor(object):
    """Processor for the Semeval data set """

    def __init__(self, args):
        self.args = args
        self.relation_labels = get_label(args)

    @classmethod
    def _read_tsv(cls, input_file, quotechar=None):
        """Reads a tab separated value file."""
        with open(input_file, "r", encoding="utf-8") as f:
            reader = csv.reader(f, delimiter="\t", quotechar=quotechar)
            lines = []
            for line in reader:
                lines.append(line)
            return lines

    def _create_examples(self, lines, set_type):
        """Creates examples for the training and dev sets."""
        examples = []
        for (i, line) in enumerate(lines):
            guid = "%s-%s" % (set_type, i)
            text_a = line[0]
            label = self.relation_labels.index(line[1])
            if i % 1000 == 0:
                logger.info(line)
            examples.append(InputExample(guid=guid, text_a=text_a, label=label))
        return examples


    def get_examples(self, mode):
        """
        Args:
            mode: train, dev, test
        """
        file_to_read = None
        if mode == "train_file":
            file_to_read = self.args.train_file
        elif mode == "eval_file":
            file_to_read = self.args.test_file
        elif mode == "test_file":
            file_to_read = self.args.test_file

        logger.info("LOOKING AT {}".format(os.path.join(self.args.data_dir, file_to_read)))
        return self._create_examples(self._read_tsv(os.path.join(self.args.data_dir, file_to_read)), mode)


processors = {"semeval": SemEvalProcessor}


def read_examples_from_file(data_dir, mode):
    file_path = os.path.join(data_dir, "{}.txt".format(mode))
    guid_index = 1
    examples = []
    with open(file_path, "r", encoding="utf-8") as f:
        for line in f.readlines():
            line = line.strip().split("\t")
            if len(line) == 2:
                text_a = line[0]
                label = line[1]
            else:
                text_a = line[0]
                label = "NONE"
            examples.append(InputExample(guid=guid_index, text_a=text_a, label=label))
            guid_index += 1

    return examples

def convert_examples_to_features(
    examples,
    max_seq_len,
    tokenizer,
    cls_token="[CLS]",
    cls_token_segment_id=0,
    sep_token="[SEP]",
    pad_token=0,
    pad_token_segment_id=0,
    sequence_a_segment_id=0,
    add_sep_token=False,
    mask_padding_with_zero=True,
):
    features = []
    for (ex_index, example) in enumerate(examples):
        if ex_index % 5000 == 0:
            logger.info("Writing example %d of %d" % (ex_index, len(examples)))

        tokens_a = tokenizer.tokenize(example.text_a)

        e11_p = tokens_a.index("<e1>")  # the start position of entity1
        e12_p = tokens_a.index("</e1>")  # the end position of entity1
        e21_p = tokens_a.index("<e2>")  # the start position of entity2
        e22_p = tokens_a.index("</e2>")  # the end position of entity2

        # Replace the token
        tokens_a[e11_p] = "$"
        tokens_a[e12_p] = "$"
        tokens_a[e21_p] = "#"
        tokens_a[e22_p] = "#"

        # Add 1 because of the [CLS] token
        e11_p += 1
        e12_p += 1
        e21_p += 1
        e22_p += 1

        # Account for [CLS] and [SEP] with "- 2" and with "- 3" for RoBERTa.
        if add_sep_token:
            special_tokens_count = 2
        else:
            special_tokens_count = 1
        if len(tokens_a) > max_seq_len - special_tokens_count:
            tokens_a = tokens_a[: (max_seq_len - special_tokens_count)]

        tokens = tokens_a
        if add_sep_token:
            tokens += [sep_token]

        token_type_ids = [sequence_a_segment_id] * len(tokens)

        tokens = [cls_token] + tokens
        token_type_ids = [cls_token_segment_id] + token_type_ids

        input_ids = tokenizer.convert_tokens_to_ids(tokens)

        # The mask has 1 for real tokens and 0 for padding tokens. Only real tokens are attended to.
        attention_mask = [1 if mask_padding_with_zero else 0] * len(input_ids)

        # Zero-pad up to the sequence length.
        padding_length = max_seq_len - len(input_ids)
        input_ids = input_ids + ([pad_token] * padding_length)
        attention_mask = attention_mask + ([0 if mask_padding_with_zero else 1] * padding_length)
        token_type_ids = token_type_ids + ([pad_token_segment_id] * padding_length)

        # e1 mask, e2 mask
        e1_mask = [0] * len(attention_mask)
        e2_mask = [0] * len(attention_mask)

        for i in range(e11_p, e12_p + 1):
            e1_mask[i] = 1
        for i in range(e21_p, e22_p + 1):
            e2_mask[i] = 1

        assert len(input_ids) == max_seq_len, "Error with input length {} vs {}".format(len(input_ids), max_seq_len)
        assert len(attention_mask) == max_seq_len, "Error with attention mask length {} vs {}".format(
            len(attention_mask), max_seq_len
        )
        assert len(token_type_ids) == max_seq_len, "Error with token type length {} vs {}".format(
            len(token_type_ids), max_seq_len
        )

        label_id = int(example.label)

        if ex_index < 5:
            logger.info("*** Example ***")
            logger.info("guid: %s" % example.guid)
            logger.info("tokens: %s" % " ".join([str(x) for x in tokens]))
            logger.info("input_ids: %s" % " ".join([str(x) for x in input_ids]))
            logger.info("attention_mask: %s" % " ".join([str(x) for x in attention_mask]))
            logger.info("token_type_ids: %s" % " ".join([str(x) for x in token_type_ids]))
            logger.info("label: %s (id = %d)" % (example.label, label_id))
            logger.info("e1_mask: %s" % " ".join([str(x) for x in e1_mask]))
            logger.info("e2_mask: %s" % " ".join([str(x) for x in e2_mask]))

        features.append(
            InputFeatures(
                input_ids=input_ids,
                attention_mask=attention_mask,
                token_type_ids=token_type_ids,
                label_id=label_id,
                e1_mask=e1_mask,
                e2_mask=e2_mask,
            )
        )

    return features


def load_and_cache_examples(args, tokenizer, mode):
    processor = processors[args.task](args)

    # Load data features from cache or dataset file
    cached_features_file = os.path.join(
        args.data_dir,
        "cached_{}_{}_{}_{}".format(
            mode,
            args.task,
            list(filter(None, args.model_name_or_path.split("/"))).pop(),
            args.max_seq_len,
        ),
    )

    if os.path.exists(cached_features_file):
        logger.info("Loading features from cached file %s", cached_features_file)
        features = torch.load(cached_features_file)
    else:
        logger.info("Creating features from dataset file at %s", args.data_dir)
        if mode == "train_file":
            examples = processor.get_examples("train_file")
        elif mode == "eval_file":
            examples = processor.get_examples("eval_file")
        elif mode == "test_file":
            examples = processor.get_examples("test_file")
        else:
            raise Exception("For mode, Only train, dev, test is available")

        features = convert_examples_to_features(
            examples, args.max_seq_len, tokenizer
        )
        logger.info("Saving features into cached file %s", cached_features_file)
        torch.save(features, cached_features_file)

    # Convert to Tensors and build dataset
    all_input_ids = torch.tensor([f.input_ids for f in features], dtype=torch.long)
    all_attention_mask = torch.tensor([f.attention_mask for f in features], dtype=torch.long)
    all_token_type_ids = torch.tensor([f.token_type_ids for f in features], dtype=torch.long)
    all_e1_mask = torch.tensor([f.e1_mask for f in features], dtype=torch.long)  # add e1 mask
    all_e2_mask = torch.tensor([f.e2_mask for f in features], dtype=torch.long)  # add e2 mask

    all_label_ids = torch.tensor([f.label_id for f in features], dtype=torch.long)

    dataset = TensorDataset(
        all_input_ids,
        all_attention_mask,
        all_token_type_ids,
        all_label_ids,
        all_e1_mask,
        all_e2_mask,
    )
    return dataset

Model

In [5]:
class FCLayer(nn.Module):
    def __init__(self, input_dim, output_dim, dropout_rate=0.0, use_activation=True):
        super(FCLayer, self).__init__()
        self.use_activation = use_activation
        self.dropout = nn.Dropout(dropout_rate)
        self.linear = nn.Linear(input_dim, output_dim)
        self.tanh = nn.Tanh()

    def forward(self, x):
        x = self.dropout(x)
        if self.use_activation:
            x = self.tanh(x)
        return self.linear(x)


class RBERT(BertPreTrainedModel):
    def __init__(self, config, args):
        super(RBERT, self).__init__(config)
        self.bert = BertModel(config=config)  # Load pretrained bert

        self.num_labels = config.num_labels

        self.cls_fc_layer = FCLayer(config.hidden_size, config.hidden_size, args.dropout_rate)
        self.entity_fc_layer = FCLayer(config.hidden_size, config.hidden_size, args.dropout_rate)
        self.label_classifier = FCLayer(
            config.hidden_size * 3,
            config.num_labels,
            args.dropout_rate,
            use_activation=False,
        )

    @staticmethod
    def entity_average(hidden_output, e_mask):
        """
        Average the entity hidden state vectors (H_i ~ H_j)
        :param hidden_output: [batch_size, j-i+1, dim]
        :param e_mask: [batch_size, max_seq_len]
                e.g. e_mask[0] == [0, 0, 0, 1, 1, 1, 0, 0, ... 0]
        :return: [batch_size, dim]
        """
        e_mask_unsqueeze = e_mask.unsqueeze(1)  # [b, 1, j-i+1]
        length_tensor = (e_mask != 0).sum(dim=1).unsqueeze(1)  # [batch_size, 1]

        # [b, 1, j-i+1] * [b, j-i+1, dim] = [b, 1, dim] -> [b, dim]
        sum_vector = torch.bmm(e_mask_unsqueeze.float(), hidden_output).squeeze(1)
        avg_vector = sum_vector.float() / length_tensor.float()  # broadcasting
        return avg_vector

    def forward(self, input_ids, attention_mask, token_type_ids, labels, e1_mask, e2_mask):
        outputs = self.bert(
            input_ids, attention_mask=attention_mask, token_type_ids=token_type_ids
        )  # sequence_output, pooled_output, (hidden_states), (attentions)
        sequence_output = outputs[0]
        pooled_output = outputs[1]  # [CLS]

        # Average
        e1_h = self.entity_average(sequence_output, e1_mask)
        e2_h = self.entity_average(sequence_output, e2_mask)

        # Dropout -> tanh -> fc_layer (Share FC layer for e1 and e2)
        pooled_output = self.cls_fc_layer(pooled_output)
        e1_h = self.entity_fc_layer(e1_h)
        e2_h = self.entity_fc_layer(e2_h)

        # Concat -> fc_layer
        concat_h = torch.cat([pooled_output, e1_h, e2_h], dim=-1)
        logits = self.label_classifier(concat_h)

        outputs = (logits,) + outputs[2:]  # add hidden states and attention if they are here

        # Softmax
        if labels is not None:
            if self.num_labels == 1:
                loss_fct = nn.MSELoss()
                loss = loss_fct(logits.view(-1), labels.view(-1))
            else:
                loss_fct = nn.CrossEntropyLoss()
                loss = loss_fct(logits.view(-1, self.num_labels), labels.view(-1))

            outputs = (loss,) + outputs

        return outputs  # (loss), logits, (hidden_states), (attentions)

Trainer

In [6]:
def get_device(pred_config):
    return "cuda" if torch.cuda.is_available() and not pred_config.no_cuda else "cpu"

def convert_input_file_to_tensor_dataset(
    args,
    cls_token_segment_id=0,
    pad_token_segment_id=0,
    sequence_a_segment_id=0,
    mask_padding_with_zero=True):
    tokenizer = load_tokenizer(args)

    # Setting based on the current model type
    cls_token = tokenizer.cls_token
    sep_token = tokenizer.sep_token
    pad_token_id = tokenizer.pad_token_id

    all_input_ids = []
    all_attention_mask = []
    all_token_type_ids = []
    all_e1_mask = []
    all_e2_mask = []

    with open(args.input_file, "r", encoding="utf-8") as f:
        for line in f:
            line = line.strip()
            tokens = tokenizer.tokenize(line)

            e11_p = tokens.index("<e1>")  # the start position of entity1
            e12_p = tokens.index("</e1>")  # the end position of entity1
            e21_p = tokens.index("<e2>")  # the start position of entity2
            e22_p = tokens.index("</e2>")  # the end position of entity2

            # Replace the token
            tokens[e11_p] = "$"
            tokens[e12_p] = "$"
            tokens[e21_p] = "#"
            tokens[e22_p] = "#"

            # Add 1 because of the [CLS] token
            e11_p += 1
            e12_p += 1
            e21_p += 1
            e22_p += 1

            # Account for [CLS] and [SEP] with "- 2" and with "- 3" for RoBERTa.
            if args.add_sep_token:
                special_tokens_count = 2
            else:
                special_tokens_count = 1
            if len(tokens) > args.max_seq_len - special_tokens_count:
                tokens = tokens[: (args.max_seq_len - special_tokens_count)]

            # Add [SEP] token
            if args.add_sep_token:
                tokens += [sep_token]
            token_type_ids = [sequence_a_segment_id] * len(tokens)

            # Add [CLS] token
            tokens = [cls_token] + tokens
            token_type_ids = [cls_token_segment_id] + token_type_ids

            input_ids = tokenizer.convert_tokens_to_ids(tokens)

            # The mask has 1 for real tokens and 0 for padding tokens. Only real tokens are attended to.
            attention_mask = [1 if mask_padding_with_zero else 0] * len(input_ids)

            # Zero-pad up to the sequence length.
            padding_length = args.max_seq_len - len(input_ids)
            input_ids = input_ids + ([pad_token_id] * padding_length)
            attention_mask = attention_mask + ([0 if mask_padding_with_zero else 1] * padding_length)
            token_type_ids = token_type_ids + ([pad_token_segment_id] * padding_length)

            # e1 mask, e2 mask
            e1_mask = [0] * len(attention_mask)
            e2_mask = [0] * len(attention_mask)

            for i in range(e11_p, e12_p + 1):
                e1_mask[i] = 1
            for i in range(e21_p, e22_p + 1):
                e2_mask[i] = 1

            all_input_ids.append(input_ids)
            all_attention_mask.append(attention_mask)
            all_token_type_ids.append(token_type_ids)
            all_e1_mask.append(e1_mask)
            all_e2_mask.append(e2_mask)

    # Change to Tensor
    all_input_ids = torch.tensor(all_input_ids, dtype=torch.long)
    all_attention_mask = torch.tensor(all_attention_mask, dtype=torch.long)
    all_token_type_ids = torch.tensor(all_token_type_ids, dtype=torch.long)
    all_e1_mask = torch.tensor(all_e1_mask, dtype=torch.long)
    all_e2_mask = torch.tensor(all_e2_mask, dtype=torch.long)

    dataset = TensorDataset(all_input_ids, all_attention_mask, all_token_type_ids, all_e1_mask, all_e2_mask)

    return dataset

In [7]:
logger = logging.getLogger(__name__)


class Trainer(object):
    def __init__(self, args, train_dataset=None, dev_dataset=None, test_dataset=None):
        self.args = args
        self.train_dataset = train_dataset
        self.dev_dataset = dev_dataset
        self.test_dataset = test_dataset

        self.label_lst = get_label(args)
        self.num_labels = len(self.label_lst)

        self.config = BertConfig.from_pretrained(
            args.model_name_or_path,
            num_labels=self.num_labels,
            finetuning_task=args.task,
            id2label={str(i): label for i, label in enumerate(self.label_lst)},
            label2id={label: i for i, label in enumerate(self.label_lst)},
        )
        self.model = RBERT.from_pretrained(args.model_name_or_path, config=self.config, args=args)

        # GPU or CPU
        self.device = "cuda" if torch.cuda.is_available() and not args.no_cuda else "cpu"
        self.model.to(self.device)

        
    def evaluate(self, mode):
        # We use test dataset because semeval doesn't have dev dataset
        if mode == "test":
            dataset = self.test_dataset
        elif mode == "dev":
            dataset = self.dev_dataset
        else:
            raise Exception("Only dev and test dataset available")

        eval_sampler = SequentialSampler(dataset)
        eval_dataloader = DataLoader(dataset, sampler=eval_sampler, batch_size=self.args.eval_batch_size)
        # Eval!

        eval_loss = 0.0
        nb_eval_steps = 0
        preds = None
        out_label_ids = None

        self.model.eval()

        for batch in tqdm(eval_dataloader, desc="Evaluating"):
            batch = tuple(t.to(self.device) for t in batch)
            with torch.no_grad():
                inputs = {
                    "input_ids": batch[0],
                    "attention_mask": batch[1],
                    "token_type_ids": batch[2],
                    "labels": batch[3],
                    "e1_mask": batch[4],
                    "e2_mask": batch[5],
                }
                outputs = self.model(**inputs)
                tmp_eval_loss, logits = outputs[:2]

                eval_loss += tmp_eval_loss.mean().item()
            nb_eval_steps += 1

            if preds is None:
                preds = logits.detach().cpu().numpy()
                out_label_ids = inputs["labels"].detach().cpu().numpy()
            else:
                preds = np.append(preds, logits.detach().cpu().numpy(), axis=0)
                out_label_ids = np.append(out_label_ids, inputs["labels"].detach().cpu().numpy(), axis=0)

        eval_loss = eval_loss / nb_eval_steps
        #results = {"loss": eval_loss}
        preds = np.argmax(preds, axis=1)
        write_prediction(self.args, os.path.join(self.args.eval_dir, "proposed_answers_bert1.txt"), preds)

        results = {"loss": eval_loss, 'accuracy' : accuracy_score(out_label_ids, preds), 
                   'f1_score': f1_score(out_label_ids, preds, average='weighted'),
                  'roc_auc': roc_auc_score(out_label_ids, preds)}

          #result = compute_metrics(preds, out_label_ids)
          #results.update(result)

        logger.info("***** Eval results *****")
        for key in sorted(results.keys()):
            logger.info("  {} = {:.4f}".format(key, results[key]))

        return results

    
    def train(self):
        train_sampler = RandomSampler(self.train_dataset)
        train_dataloader = DataLoader(
            self.train_dataset,
            sampler=train_sampler,
            batch_size=self.args.train_batch_size,
        )

        if self.args.max_steps > 0:
            t_total = self.args.max_steps
            self.args.num_train_epochs = (
                self.args.max_steps // (len(train_dataloader) // self.args.gradient_accumulation_steps) + 1
            )
        else:
            t_total = len(train_dataloader) // self.args.gradient_accumulation_steps * self.args.num_train_epochs

        # Prepare optimizer and schedule (linear warmup and decay)
        no_decay = ["bias", "LayerNorm.weight"]
        optimizer_grouped_parameters = [
            {
                "params": [p for n, p in self.model.named_parameters() if not any(nd in n for nd in no_decay)],
                "weight_decay": self.args.weight_decay,
            },
            {
                "params": [p for n, p in self.model.named_parameters() if any(nd in n for nd in no_decay)],
                "weight_decay": 0.0,
            },
        ]
        optimizer = AdamW(
            optimizer_grouped_parameters,
            lr=self.args.learning_rate,
            eps=self.args.adam_epsilon,
        )
        scheduler = get_linear_schedule_with_warmup(
            optimizer,
            num_warmup_steps=self.args.warmup_steps,
            num_training_steps=t_total,
        )
        # Train!

        global_step = 0
        tr_loss = 0.0
        self.model.zero_grad()

        train_iterator = trange(int(self.args.num_train_epochs), desc="Epoch")

        for _ in train_iterator:
            epoch_iterator = tqdm(train_dataloader, desc="Iteration")
            for step, batch in enumerate(epoch_iterator):
                self.model.train()
                batch = tuple(t.to(self.device) for t in batch)  # GPU or CPU
                inputs = {
                    "input_ids": batch[0],
                    "attention_mask": batch[1],
                    "token_type_ids": batch[2],
                    "labels": batch[3],
                    "e1_mask": batch[4],
                    "e2_mask": batch[5],
                }
                outputs = self.model(**inputs)
                loss = outputs[0]

                if self.args.gradient_accumulation_steps > 1:
                    loss = loss / self.args.gradient_accumulation_steps

                loss.backward()

                tr_loss += loss.item()
                if (step + 1) % self.args.gradient_accumulation_steps == 0:
                    torch.nn.utils.clip_grad_norm_(self.model.parameters(), self.args.max_grad_norm)

                    optimizer.step()
                    scheduler.step()  # Update learning rate schedule
                    self.model.zero_grad()
                    global_step += 1

            print("\n====Evaluation====")
            print("\nEvaluation: ", self.evaluate("test"))
            
        self.save_model(self.model)

    def save_model(self, model):
        torch.save(model.state_dict(), 'model/model_bert_base1.bin')

Main

In [9]:
def RBERT_re(args):
    set_seed(args)
    tokenizer = load_tokenizer(args)

    train_dataset = load_and_cache_examples(args, tokenizer, mode="train_file")
    test_dataset = load_and_cache_examples(args, tokenizer, mode="eval_file")

    trainer = Trainer(args, train_dataset=train_dataset, test_dataset=test_dataset)


    if args.do_train:
        trainer.train()

In [12]:
class Trainer_args(object):
    def __init__(self,
                model_name_or_path = 'bert-base-uncased',
                seed = 24,
                task = "semeval",
                train_file = 'train_balanced.csv', 
                test_file = 'eval_balanced.csv',
                label_file = 'label.txt',  
                dropout_rate = 0.1,
                num_labels = 2,
                learning_rate = 2e-5,
                num_train_epochs = 11,
                max_seq_len = 384,
                train_batch_size = 16,
                eval_batch_size = 16,
                adam_epsilon = 1e-8,
                gradient_accumulation_steps = 1,
                max_grad_norm = 1.0,
                logging_steps = 250,
                save_steps = 250,
                weight_decay = 0.0,
                add_sep_token = True,
                do_train = True,
                no_cuda = True,
                do_eval = True,
                max_steps = -1,
                warmup_steps = 0,
                model_dir = 'model/',
                data_dir = '../data/',
                eval_dir = '../data/'
                ):

        super(Trainer_args, self).__init__()

        self.train_file = train_file
        self.test_file = test_file
        self.dropout_rate = dropout_rate
        self.num_labels = num_labels
        self.learning_rate = learning_rate
        self.num_train_epochs = num_train_epochs
        self.max_seq_len = max_seq_len
        self.train_batch_size = train_batch_size
        self.adam_epsilon = adam_epsilon
        self.gradient_accumulation_steps = gradient_accumulation_steps
        self.max_grad_norm = max_grad_norm
        self.logging_steps = logging_steps
        self.save_steps = save_steps
        self.weight_decay = weight_decay
        self.data_dir = data_dir
        self.model_name_or_path = model_name_or_path
        self.seed = seed
        self.task = task
        self.add_sep_token = add_sep_token
        self.do_train = do_train
        self.no_cuda = no_cuda
        self.max_steps = max_steps
        self.warmup_steps = warmup_steps
        self.model_dir = model_dir
        self.label_file = label_file
        self.eval_batch_size = eval_batch_size
        self.do_eval = do_eval
        self.eval_dir = eval_dir
        return 
args = Trainer_args()

In [13]:
train_path = '../data/train_balanced.csv'

In [14]:
main_model = RBERT_re(args)

Some weights of the model checkpoint at bert-base-uncased were not used when initializing RBERT: ['cls.predictions.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.dense.bias', 'cls.predictions.decoder.weight', 'cls.seq_relationship.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.LayerNorm.bias']
- This IS expected if you are initializing RBERT from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RBERT from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of RBERT were not initialized from the model checkpoint at bert-base-uncased and are newly initialized: ['cls_fc_layer.linear.weight', 'cls_fc_layer.linea


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:37<06:48, 37.15s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:15<06:16, 37.62s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:54<05:42, 38.02s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:33<05:05, 38.18s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:12<04:28, 38.36s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:51<03:51, 38.54s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:31<03:15, 39.17s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [05:14<02:41, 40.28s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:56<02:02, 40.89s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:40<01:23, 41.55s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [07:22<00:41, 41.72s/it][A
Eva


Evaluation:  {'loss': 0.5066063528259596, 'accuracy': 0.8379888268156425, 'f1_score': 0.7641235502878199, 'roc_auc': 0.5}



Iteration:   6%|█▊                             | 1/17 [02:34<41:05, 154.06s/it][A
Iteration:  12%|███▋                           | 2/17 [05:52<41:45, 167.04s/it][A
Iteration:  18%|█████▍                         | 3/17 [07:40<34:54, 149.57s/it][A
Iteration:  24%|███████▎                       | 4/17 [09:37<30:14, 139.60s/it][A
Iteration:  29%|█████████                      | 5/17 [11:27<26:13, 131.13s/it][A
Iteration:  35%|██████████▉                    | 6/17 [13:27<23:21, 127.44s/it][A
Iteration:  41%|████████████▊                  | 7/17 [15:22<20:37, 123.79s/it][A
Iteration:  47%|██████████████▌                | 8/17 [17:19<18:08, 120.92s/it][A
Iteration:  53%|████████████████▍              | 9/17 [19:22<16:18, 122.36s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [21:22<14:11, 121.70s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [23:52<12:52, 128.78s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [28:00<13:49, 165.84s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:37<06:57, 37.93s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:16<06:19, 38.00s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:54<05:43, 38.14s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:32<05:05, 38.17s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:11<04:28, 38.30s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:49<03:50, 38.34s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:28<03:11, 38.38s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [05:06<02:33, 38.36s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:44<01:54, 38.13s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:20<01:15, 37.53s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [06:56<00:37, 37.11s/it][A
Eva


Evaluation:  {'loss': 0.5187283555666605, 'accuracy': 0.8324022346368715, 'f1_score': 0.7869171958314539, 'roc_auc': 0.5383908045977012}



Iteration:   6%|█▊                             | 1/17 [01:45<28:05, 105.34s/it][A
Iteration:  12%|███▋                           | 2/17 [03:32<26:23, 105.59s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:14<24:26, 104.74s/it][A
Iteration:  24%|███████▎                       | 4/17 [06:57<22:36, 104.37s/it][A
Iteration:  29%|█████████                      | 5/17 [08:43<20:56, 104.69s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:26<19:07, 104.35s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:10<17:21, 104.19s/it][A
Iteration:  47%|██████████████▌                | 8/17 [13:58<15:47, 105.33s/it][A
Iteration:  53%|████████████████▍              | 9/17 [15:41<13:56, 104.60s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [17:26<12:12, 104.69s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:07<10:22, 103.69s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [20:54<08:43, 104.69s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:36<06:40, 36.44s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:13<06:05, 36.53s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:49<05:29, 36.58s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:26<04:52, 36.50s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:02<04:15, 36.55s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:39<03:39, 36.57s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:16<03:02, 36.57s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [04:52<02:26, 36.56s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:29<01:49, 36.61s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:05<01:12, 36.49s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [06:41<00:36, 36.40s/it][A
Eva


Evaluation:  {'loss': 0.4698467080791791, 'accuracy': 0.8379888268156425, 'f1_score': 0.8033493508353843, 'roc_auc': 0.5695402298850575}



Iteration:   6%|█▊                             | 1/17 [01:44<27:56, 104.77s/it][A
Iteration:  12%|███▋                           | 2/17 [03:32<26:26, 105.77s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:19<24:42, 105.90s/it][A
Iteration:  24%|███████▎                       | 4/17 [07:03<22:49, 105.32s/it][A
Iteration:  29%|█████████                      | 5/17 [08:48<21:05, 105.42s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:34<19:20, 105.53s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:18<17:31, 105.14s/it][A
Iteration:  47%|██████████████▌                | 8/17 [14:03<15:44, 104.94s/it][A
Iteration:  53%|████████████████▍              | 9/17 [15:49<14:03, 105.43s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [17:37<12:23, 106.25s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:21<10:32, 105.39s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [21:04<08:43, 104.75s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:37<06:55, 37.74s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:14<06:14, 37.45s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:51<05:35, 37.24s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:27<04:55, 37.00s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:04<04:18, 36.92s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:41<03:41, 36.86s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:17<03:03, 36.72s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [04:54<02:26, 36.64s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:30<01:49, 36.59s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:06<01:12, 36.49s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [06:43<00:36, 36.45s/it][A
Eva


Evaluation:  {'loss': 0.44764966517686844, 'accuracy': 0.8324022346368715, 'f1_score': 0.8047218321597785, 'roc_auc': 0.5801149425287356}



Iteration:   6%|█▊                             | 1/17 [01:41<27:08, 101.78s/it][A
Iteration:  12%|███▋                           | 2/17 [03:27<25:46, 103.09s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:13<24:12, 103.75s/it][A
Iteration:  24%|███████▎                       | 4/17 [07:01<22:44, 104.98s/it][A
Iteration:  29%|█████████                      | 5/17 [08:48<21:09, 105.76s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:38<19:35, 106.89s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:27<17:57, 107.74s/it][A
Iteration:  47%|██████████████▌                | 8/17 [14:14<16:06, 107.36s/it][A
Iteration:  53%|████████████████▍              | 9/17 [15:58<14:11, 106.50s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [17:44<12:23, 106.27s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:29<10:35, 105.98s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [21:15<08:48, 105.75s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:36<06:45, 36.91s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:14<06:09, 36.97s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:50<05:32, 36.94s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:27<04:54, 36.80s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:04<04:17, 36.79s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:41<03:41, 36.87s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:17<03:04, 36.84s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [04:54<02:27, 36.78s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:31<01:50, 36.71s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:07<01:13, 36.70s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [06:44<00:36, 36.65s/it][A
Eva


Evaluation:  {'loss': 0.44092554599046707, 'accuracy': 0.8491620111731844, 'f1_score': 0.8305067199742983, 'roc_auc': 0.6318390804597701}



Iteration:   6%|█▊                             | 1/17 [01:46<28:27, 106.70s/it][A
Iteration:  12%|███▋                           | 2/17 [03:35<26:49, 107.33s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:25<25:12, 108.01s/it][A
Iteration:  24%|███████▎                       | 4/17 [07:14<23:27, 108.30s/it][A
Iteration:  29%|█████████                      | 5/17 [09:03<21:44, 108.72s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:50<19:47, 107.98s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:38<18:00, 108.05s/it][A
Iteration:  47%|██████████████▌                | 8/17 [14:27<16:15, 108.39s/it][A
Iteration:  53%|████████████████▍              | 9/17 [16:14<14:23, 107.92s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [18:03<12:37, 108.23s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:52<10:50, 108.44s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [21:41<09:03, 108.72s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:38<07:01, 38.31s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:16<06:23, 38.38s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:54<05:44, 38.25s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:32<05:04, 38.09s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:09<04:25, 37.87s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:48<03:48, 38.13s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:27<03:11, 38.22s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [05:05<02:33, 38.38s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:44<01:55, 38.37s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:24<01:17, 38.92s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [07:02<00:38, 38.60s/it][A
Eva


Evaluation:  {'loss': 0.45442944516738254, 'accuracy': 0.8491620111731844, 'f1_score': 0.8341783100186015, 'roc_auc': 0.6457471264367816}



Iteration:   6%|█▊                             | 1/17 [01:47<28:32, 107.02s/it][A
Iteration:  12%|███▋                           | 2/17 [03:31<26:33, 106.26s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:18<24:51, 106.53s/it][A
Iteration:  24%|███████▎                       | 4/17 [07:02<22:54, 105.72s/it][A
Iteration:  29%|█████████                      | 5/17 [08:46<21:01, 105.10s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:30<19:14, 104.98s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:20<17:44, 106.49s/it][A
Iteration:  47%|██████████████▌                | 8/17 [14:06<15:55, 106.17s/it][A
Iteration:  53%|████████████████▍              | 9/17 [15:51<14:07, 105.94s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [17:39<12:26, 106.58s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:28<10:43, 107.18s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [21:16<08:57, 107.51s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:36<06:39, 36.31s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:13<06:04, 36.44s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:50<05:30, 36.69s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:27<04:53, 36.69s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:04<04:17, 36.82s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:41<03:41, 36.88s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:17<03:03, 36.78s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [04:54<02:27, 36.76s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:30<01:49, 36.65s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:07<01:13, 36.57s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [06:44<00:36, 36.73s/it][A
Eva


Evaluation:  {'loss': 0.45002453463772935, 'accuracy': 0.8770949720670391, 'f1_score': 0.8602818204462157, 'roc_auc': 0.6763218390804597}



Iteration:   6%|█▊                             | 1/17 [01:44<27:49, 104.37s/it][A
Iteration:  12%|███▋                           | 2/17 [03:28<26:04, 104.32s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:14<24:25, 104.66s/it][A
Iteration:  24%|███████▎                       | 4/17 [06:59<22:41, 104.76s/it][A
Iteration:  29%|█████████                      | 5/17 [08:45<21:01, 105.15s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:31<19:20, 105.46s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:19<17:42, 106.27s/it][A
Iteration:  47%|██████████████▌                | 8/17 [14:03<15:50, 105.62s/it][A
Iteration:  53%|████████████████▍              | 9/17 [15:51<14:11, 106.43s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [17:40<12:30, 107.21s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:29<10:45, 107.60s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [21:18<08:59, 107.97s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:36<06:42, 36.60s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:15<06:13, 37.35s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:51<05:33, 37.03s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:28<04:54, 36.82s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:05<04:17, 36.79s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:41<03:40, 36.78s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:18<03:03, 36.71s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [04:55<02:26, 36.70s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:31<01:49, 36.64s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:07<01:12, 36.50s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [06:44<00:36, 36.47s/it][A
Eva


Evaluation:  {'loss': 0.4787951971714695, 'accuracy': 0.88268156424581, 'f1_score': 0.8710275744589123, 'roc_auc': 0.707471264367816}



Iteration:   6%|█▊                             | 1/17 [01:41<27:11, 101.94s/it][A
Iteration:  12%|███▋                           | 2/17 [03:29<25:55, 103.67s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:15<24:19, 104.23s/it][A
Iteration:  24%|███████▎                       | 4/17 [07:00<22:37, 104.45s/it][A
Iteration:  29%|█████████                      | 5/17 [08:48<21:08, 105.69s/it][A
Iteration:  35%|██████████▉                    | 6/17 [10:34<19:21, 105.57s/it][A
Iteration:  41%|████████████▊                  | 7/17 [12:22<17:45, 106.53s/it][A
Iteration:  47%|██████████████▌                | 8/17 [14:11<16:04, 107.17s/it][A
Iteration:  53%|████████████████▍              | 9/17 [15:59<14:20, 107.52s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [17:47<12:32, 107.54s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [19:34<10:44, 107.46s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [21:19<08:52, 106.58s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:37<06:54, 37.73s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:16<06:20, 38.03s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:55<05:45, 38.43s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:33<05:06, 38.34s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:14<04:32, 38.96s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:53<03:53, 38.91s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:32<03:15, 39.14s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [05:11<02:36, 39.11s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:50<01:56, 38.85s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:28<01:17, 38.60s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [07:06<00:38, 38.40s/it][A
Eva


Evaluation:  {'loss': 0.503812527594467, 'accuracy': 0.8770949720670391, 'f1_score': 0.8602818204462157, 'roc_auc': 0.6763218390804597}



Iteration:   6%|█▊                             | 1/17 [02:00<32:05, 120.34s/it][A
Iteration:  12%|███▋                           | 2/17 [03:48<29:08, 116.56s/it][A
Iteration:  18%|█████▍                         | 3/17 [05:41<26:56, 115.45s/it][A
Iteration:  24%|███████▎                       | 4/17 [07:42<25:23, 117.21s/it][A
Iteration:  29%|█████████                      | 5/17 [09:57<24:27, 122.29s/it][A
Iteration:  35%|██████████▉                    | 6/17 [12:11<23:06, 126.02s/it][A
Iteration:  41%|████████████▊                  | 7/17 [14:10<20:38, 123.88s/it][A
Iteration:  47%|██████████████▌                | 8/17 [16:13<18:32, 123.62s/it][A
Iteration:  53%|████████████████▍              | 9/17 [18:36<17:15, 129.41s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [20:59<15:33, 133.42s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [23:06<13:09, 131.57s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [25:27<11:12, 134.42s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:37<06:57, 37.97s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:15<06:18, 37.89s/it][A
Evaluating:  25%|███████▊                       | 3/12 [01:52<05:38, 37.56s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:30<05:02, 37.81s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:09<04:26, 38.01s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [03:46<03:46, 37.67s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:22<03:06, 37.38s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [04:59<02:28, 37.15s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [05:42<01:56, 39.00s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [06:25<01:20, 40.23s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [07:11<00:41, 41.94s/it][A
Eva


Evaluation:  {'loss': 0.46619628990689915, 'accuracy': 0.8770949720670391, 'f1_score': 0.8753072097165479, 'roc_auc': 0.7597701149425289}



Iteration:   6%|█▊                             | 1/17 [02:06<33:40, 126.25s/it][A
Iteration:  12%|███▋                           | 2/17 [04:41<33:40, 134.69s/it][A
Iteration:  18%|█████▍                         | 3/17 [07:00<31:46, 136.19s/it][A
Iteration:  24%|███████▎                       | 4/17 [09:05<28:44, 132.65s/it][A
Iteration:  29%|█████████                      | 5/17 [11:24<26:55, 134.60s/it][A
Iteration:  35%|██████████▉                    | 6/17 [13:49<25:13, 137.63s/it][A
Iteration:  41%|████████████▊                  | 7/17 [15:44<21:48, 130.88s/it][A
Iteration:  47%|██████████████▌                | 8/17 [17:39<18:56, 126.23s/it][A
Iteration:  53%|████████████████▍              | 9/17 [19:55<17:12, 129.07s/it][A
Iteration:  59%|█████████████████▋            | 10/17 [22:05<15:06, 129.43s/it][A
Iteration:  65%|███████████████████▍          | 11/17 [24:26<13:16, 132.74s/it][A
Iteration:  71%|█████████████████████▏        | 12/17 [26:51<11:23, 136.64s/it][A
Ite


====Evaluation====



Evaluating:   0%|                                       | 0/12 [00:00<?, ?it/s][A
Evaluating:   8%|██▌                            | 1/12 [00:43<07:57, 43.40s/it][A
Evaluating:  17%|█████▏                         | 2/12 [01:25<07:10, 43.05s/it][A
Evaluating:  25%|███████▊                       | 3/12 [02:08<06:27, 43.04s/it][A
Evaluating:  33%|██████████▎                    | 4/12 [02:50<05:42, 42.75s/it][A
Evaluating:  42%|████████████▉                  | 5/12 [03:31<04:54, 42.05s/it][A
Evaluating:  50%|███████████████▌               | 6/12 [04:13<04:12, 42.12s/it][A
Evaluating:  58%|██████████████████             | 7/12 [04:59<03:36, 43.31s/it][A
Evaluating:  67%|████████████████████▋          | 8/12 [05:43<02:53, 43.49s/it][A
Evaluating:  75%|███████████████████████▎       | 9/12 [06:27<02:10, 43.62s/it][A
Evaluating:  83%|█████████████████████████     | 10/12 [07:09<01:26, 43.28s/it][A
Evaluating:  92%|███████████████████████████▌  | 11/12 [07:49<00:42, 42.34s/it][A
Eva


Evaluation:  {'loss': 0.46982651265958947, 'accuracy': 0.8659217877094972, 'f1_score': 0.8659217877094972, 'roc_auc': 0.7531034482758621}


Epoch: 100%|███████████████████████████████| 11/11 [7:17:46<00:00, 2387.85s/it]
