Attempt 010 Summarization - follow-up to Attempt 008 summarization, with 10-fold cross-validation

In [None]:
# Environment setup: set CUDA_VISIBLE_DEVICES to 0 for this kernel, then install the
# Hugging Face libraries, the torch / torch_xla stack and accelerate.
# Note: the torch_xla wheel below is a cp37 build, i.e. it targets Python 3.7.
%env CUDA_VISIBLE_DEVICES=0
!pip install transformers datasets
!pip install cloud-tpu-client==0.10 torch==1.12.0 https://storage.googleapis.com/tpu-pytorch/wheels/colab/torch_xla-1.12-cp37-cp37m-linux_x86_64.whl tensorboard-plugin-profile
!pip install accelerate

env: CUDA_VISIBLE_DEVICES=0
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting torch-xla==1.12
  Using cached https://storage.googleapis.com/tpu-pytorch/wheels/colab/torch_xla-1.12-cp37-cp37m-linux_x86_64.whl (187.4 MB)
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


In [None]:
#adapted from https://github.com/FakeNewsChallenge/fnc-1-baseline/tree/master/utils
from csv import DictReader
import random
import os
from collections import defaultdict
import sys
import os
import re
import argparse

In [None]:
#Loading dataset from summaries
class DataReaderFromPath():
    """Load stance rows and per-article summaries from CSV files in a directory.

    Two files are read from ``path``:

    * ``<name>_stances.csv`` (or ``<name>_stances_unlabeled.csv`` when
      ``is_unlabeled`` is exactly ``True``) -> ``self.stances``, a list of row
      dicts whose ``'Body ID'`` value is converted to ``int``;
    * ``<name>_summaries.csv`` -> ``self.summaries``, a dict mapping the integer
      ``'Body ID'`` to the ``'articleSummary'`` text.
    """

    def __init__(self, name="train", path="fnc-1", is_unlabeled=False):
        """Read both CSV files and print how many rows of each were loaded.

        Args:
            name: File-name prefix of the split to load (e.g. ``"train"``).
            path: Directory that contains the CSV files.
            is_unlabeled: When ``True``, read the ``_unlabeled`` stances file.
        """
        self.path = path
        print("Reading data from path : " + str(path) + " " )

        stances_file = name + "_stances"
        if is_unlabeled is True:
            stances_file = stances_file + "_unlabeled"
        stances_file = stances_file + ".csv"
        summaries_file = name + "_summaries.csv"

        self.stances = self.read(stances_file)
        summary_rows = self.read(summaries_file)

        # Body IDs are read as strings; store them as ints so they can be used
        # as keys into self.summaries.
        for stance in self.stances:
            stance['Body ID'] = int(stance['Body ID'])

        # Index the summaries by their integer body id.
        self.summaries = {
            int(row['Body ID']): row['articleSummary'] for row in summary_rows
        }

        print("Total stances: " + str(len(self.stances)))
        print("Total summaries: " + str(len(self.summaries)))

    def read(self, filename):
        """Return every row of ``<self.path>/<filename>`` as a list of dicts.

        The file is opened with ``newline=''`` as the ``csv`` module requires, so
        line breaks embedded inside quoted fields reach the parser unmodified.
        """
        with open(self.path + "/" + filename, "r", encoding='utf-8', newline='') as table:
            return list(DictReader(table))

In [None]:
import random
import os
from collections import defaultdict


def generate_hold_out_split(dataset, training = 0.8, base_dir="splits"):
    """Shuffle the body ids with a fixed seed and write a train/hold-out split to disk.

    Args:
        dataset: Reader object exposing the bodies as a dict keyed by body id,
            either as ``articles`` or as ``summaries`` (the attribute
            ``DataReaderFromPath`` provides).
        training: Fraction of the ids written to the training file.
        base_dir: Directory receiving ``training_ids.txt`` and
            ``hold_out_ids.txt``; created when it does not exist.
    """
    r = random.Random()
    r.seed(1489215)  # fixed seed so the split is reproducible

    # DataReaderFromPath has no `articles` attribute, so fall back to `summaries`.
    bodies = getattr(dataset, "articles", None)
    if bodies is None:
        bodies = dataset.summaries

    article_ids = list(bodies.keys())  # get a list of article ids
    r.shuffle(article_ids)  # and shuffle that list

    cut = int(training * len(article_ids))
    training_ids = article_ids[:cut]
    hold_out_ids = article_ids[cut:]

    # write the split body ids out to files for future use
    os.makedirs(base_dir, exist_ok=True)
    with open(base_dir + "/" + "training_ids.txt", "w+") as f:
        f.write("\n".join([str(id) for id in training_ids]))

    with open(base_dir + "/" + "hold_out_ids.txt", "w+") as f:
        f.write("\n".join([str(id) for id in hold_out_ids]))


def read_ids(file,base):
    """Read one integer id per line from ``<base>/<file>``.

    Blank lines (for example a trailing newline at the end of the file) are
    skipped instead of raising ``ValueError``.

    Returns:
        The ids as a list of ints, in file order.
    """
    ids = []
    with open(base+"/"+file,"r") as f:
        for line in f:
            line = line.strip()
            if line:
                ids.append(int(line))
    return ids


def kfold_split(dataset, training = 0.8, n_folds = 10, base_dir="splits"):
    """Return ``(folds, hold_out_ids)`` built from the id files in ``base_dir``.

    If either id file is missing, the hold-out split is generated first. The
    training ids are then cut into ``n_folds`` consecutive slices.
    """
    training_path = base_dir + "/" + "training_ids.txt"
    hold_out_path = base_dir + "/" + "hold_out_ids.txt"
    if not os.path.exists(training_path) or not os.path.exists(hold_out_path):
        generate_hold_out_split(dataset,training,base_dir)

    training_ids = read_ids("training_ids.txt", base_dir)
    hold_out_ids = read_ids("hold_out_ids.txt", base_dir)

    n_ids = len(training_ids)
    # Fold k covers the ids from position int(k*n/n_folds) up to int((k+1)*n/n_folds).
    folds = [
        training_ids[int(k * n_ids / n_folds):int((k + 1) * n_ids / n_folds)]
        for k in range(n_folds)
    ]

    return folds,hold_out_ids


def get_stances_for_folds(dataset,folds,hold_out):
    """Group the dataset's stance rows by the fold (or hold-out set) of their body id.

    Args:
        dataset: Object whose ``stances`` is an iterable of dicts with a
            ``'Body ID'`` entry.
        folds: Sequence of collections of body ids, one per fold.
        hold_out: Collection of body ids reserved for the hold-out set.

    Returns:
        ``(stances_folds, stances_hold_out)``: a ``defaultdict`` mapping fold
        index to the list of stances in that fold, and the list of hold-out
        stances. Stances whose body id is in neither are dropped.
    """
    # Sets give O(1) membership tests; the id lists can hold hundreds of entries
    # and are probed once per stance.
    hold_out_lookup = set(hold_out)
    fold_lookups = [set(fold) for fold in folds]

    stances_folds = defaultdict(list)
    stances_hold_out = []
    for stance in dataset.stances:
        body_id = stance['Body ID']
        if body_id in hold_out_lookup:
            stances_hold_out.append(stance)
            continue
        for fold_id, members in enumerate(fold_lookups):
            if body_id in members:
                stances_folds[fold_id].append(stance)

    return stances_folds,stances_hold_out


Reading data from path : fnc-1 
Total stances: 49972
Total summaries: 1683


In [None]:
# Load the default split ("train") from the default directory ("fnc-1").
d = DataReaderFromPath()

In [None]:
# Adapted from https://github.com/FakeNewsChallenge/fnc-1/blob/master/scorer.py
from sklearn.metrics import confusion_matrix
from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import json
# Stance classes; elsewhere in this notebook a label's integer id is its index in this list.
LABELS = ['agree', 'disagree', 'discuss', 'unrelated']
LABELS_RELATED = ['unrelated', 'related']
# The first three stance classes, i.e. every class except 'unrelated'.
RELATED = LABELS[0:3]


def score_submission(gold_labels, test_labels):
    """Compute the weighted stance score and the 4x4 confusion matrix.

    Per (gold, predicted) pair: 0.25 for an exact match, plus 0.50 when that
    match is not 'unrelated', plus 0.25 when both labels are in RELATED.

    Returns:
        ``(score, cm)`` where ``cm[g][t]`` counts pairs with gold label
        ``LABELS[g]`` and predicted label ``LABELS[t]``.
    """
    cm = [[0] * 4 for _ in range(4)]
    score = 0.0

    for gold, predicted in zip(gold_labels, test_labels):
        if gold == predicted:
            # exact match: base credit, with a bonus for the non-'unrelated' classes
            score += 0.25
            if not gold == 'unrelated':
                score += 0.50

        both_related = gold in RELATED and predicted in RELATED
        if both_related:
            score += 0.25

        row = LABELS.index(gold)
        col = LABELS.index(predicted)
        cm[row][col] += 1

    return score, cm


def print_confusion_matrix(cm):
    """Print the confusion matrix as a fixed-width text table.

    Args:
        cm: Sequence of rows, one per entry of LABELS (gold label), each holding
            one count per entry of LABELS (predicted label).
    """
    row_format = "|{:^11}|{:^11}|{:^11}|{:^11}|{:^11}|"
    header = row_format.format('', *LABELS)
    rule = "-" * len(header)

    lines = [rule, header, rule]
    # The former `hit`/`total` accumulators were never read, so they are gone.
    for i, row in enumerate(cm):
        lines.append(row_format.format(LABELS[i], *row))
        lines.append(rule)
    print('\n'.join(lines))


def report_score(actual, predicted):
    """Print the confusion matrix, the relative score and all metrics.

    Returns:
        The achieved score as a percentage of the best attainable score (the
        score obtained by predicting ``actual`` itself).
    """
    score, cm = score_submission(actual, predicted)
    best_score, _ = score_submission(actual, actual)

    print_confusion_matrix(cm)

    percentage = score * 100 / best_score
    print(f"Score: {score} out of {best_score}\t({percentage}%)")

    all_values = get_precision_recall_f1_scores(actual, predicted)
    print("--All Metrics --")
    print(json.dumps(all_values, indent=4, sort_keys=True, separators=(',', ': ')))

    return percentage

#Calculating accuracy precision recall f1 scores
def get_precision_recall_f1_scores(actual, predicted):
    """Collect accuracy, precision, recall and F1 per class and per averaging mode.

    Returns:
        A dict with the keys "Each_Class", "micro", "macro" and "weighted". Each
        value is a dict with "accuracy", "precision", "recall" and "f1"; under
        "Each_Class" the last three are lists of single-entry ``{label: value}``
        dicts, one per entry of LABELS.
    """
    def _prf(average):
        # precision / recall / F1 over LABELS for one averaging mode
        precision, recall, f1, _ = precision_recall_fscore_support(
            y_true=actual, y_pred=predicted, labels=LABELS, zero_division=0.0,
            average=average)
        return precision, recall, f1

    def _per_label(values):
        # pair each per-class value with its label name
        return [{LABELS[index]: value} for index, value in enumerate(values)]

    # per-class values (average=None)
    p, r, f1 = _prf(None)
    acc = accuracy_score(actual, predicted)
    all_values = {
        "Each_Class": {
            "accuracy": acc,
            "precision": _per_label(p),
            "recall": _per_label(r),
            "f1": _per_label(f1),
        }
    }

    # aggregated values, one entry per averaging mode
    for mode in ('micro', 'macro', 'weighted'):
        p, r, f1 = _prf(mode)
        all_values[mode] = {"accuracy": acc, "precision": p, "recall": r, "f1": f1}

    return all_values

def compute_metrics(pred):
    """Return accuracy and macro-averaged precision/recall/F1 for a prediction object.

    Args:
        pred: Object with ``label_ids`` (gold class indices) and ``predictions``
            (scores whose ``argmax(-1)`` gives the predicted class index).
            Presumably a transformers ``EvalPrediction`` - TODO confirm.
    """
    def _to_names(indices):
        # map class indices to their LABELS names
        return [LABELS[int(index)] for index in indices]

    actual = _to_names(pred.label_ids)
    predicted = _to_names(pred.predictions.argmax(-1))

    acc = accuracy_score(actual, predicted)
    # macro average over the four stance classes
    precision, recall, f1, _ = precision_recall_fscore_support(
        y_true=actual, y_pred=predicted, labels=LABELS, zero_division=0.0,
        average='macro')

    return {"accuracy": acc, "precision": precision, "recall": recall, "f1": f1}

In [None]:
#adapted from https://github.com/FakeNewsChallenge/fnc-1-baseline/blob/master/feature_engineering.py
import os
import re
import nltk
import numpy as np
from tqdm import tqdm

def combine_headline_and_bodies(headlines, bodies):
    """Join each headline with its body text using the ' <TitleSummarySep> ' marker.

    Returns:
        A list with one combined string per (headline, body) pair, in order.
    """
    progress = tqdm(enumerate(zip(headlines, bodies)))
    return [
        title + " <TitleSummarySep> " + text
        for _, (title, text) in progress
    ]

2it [00:00, 24244.53it/s]

['The world is ending <TitleSummarySep> The world is ending', 'We all are about to die <TitleSummarySep> We all are about to die. Everyone will be dead. We will. Kill us.']





In [None]:
# Smoke test: combine two toy headline/body pairs and show the joined strings.
headlines = ["The world is ending","We all are about to die"]
bodies = ["The world is ending","We all are about to die. Everyone will be dead. We will. Kill us."]
fp = combine_headline_and_bodies(headlines, bodies)
print(fp)

In [None]:
#adapted from https://github.com/FakeNewsChallenge/fnc-1-baseline/blob/master/fnc_kfold.py
import sys
import numpy as np


def generate_labeled_data(stances, dataset, name):
    """Build model inputs and integer labels for a list of labelled stances.

    Args:
        stances: Iterable of dicts with 'Stance', 'Headline' and 'Body ID'.
        dataset: Object whose ``summaries`` maps a body id to its summary text.
        name: Unused; kept so existing callers keep working.

    Returns:
        ``(X, y)``: the combined headline/summary strings and, for each one,
        the index of its stance in LABELS.
    """
    h, b, y = [], [], []

    for stance in stances:
        y.append(LABELS.index(stance['Stance']))
        h.append(stance['Headline'])
        b.append(dataset.summaries[stance['Body ID']])

    # The former debug `print(y)` dumped every label of the split into the
    # notebook output; it has been removed.
    X = combine_headline_and_bodies(h, b)

    return X, y


def generate_data_without_labels(stances, dataset, name):
    """Build the combined headline/summary strings for stances that carry no label.

    ``name`` is accepted but not used.
    """
    stance_rows = list(stances)
    titles = [row['Headline'] for row in stance_rows]
    texts = [dataset.summaries[row['Body ID']] for row in stance_rows]
    return combine_headline_and_bodies(titles, texts)

Reading data from path : fnc-1 
Total stances: 49972
Total summaries: 1683


9622it [00:00, 797155.53it/s]


[3, 0, 3, 3, 0, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 0, 3, 3, 0, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 2, 3, 3, 2, 3, 2, 3, 1, 3, 0, 3, 3, 3, 3, 3, 2, 3, 3, 1, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 0, 2, 3, 3, 2, 3, 2, 3, 3, 3, 0, 0, 3, 3, 3, 3, 3, 3, 0, 2, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 3, 2, 0, 3, 3, 2, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 0, 3, 3, 3, 2, 3, 0, 2, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 0, 0, 2, 3, 3, 2, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 2, 2, 3, 2, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 2, 0, 3, 3, 3, 3, 3, 1, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 

4124it [00:00, 580602.50it/s]


[0, 3, 3, 0, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 2, 3, 3, 3, 2, 1, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 0, 3, 0, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 2, 0, 0, 0, 3, 3, 3, 3, 0, 3, 0, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 0, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 2, 1, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 1, 3, 3, 1, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 0, 3, 0, 3, 3, 2, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 3, 3, 3, 2, 0, 1, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 2, 0, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 2, 3, 3, 3, 3, 3, 2, 2, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 2, 2, 2, 3, 0, 2, 0, 3, 2, 3, 3, 3, 3, 2, 3, 0, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 0, 3, 3, 0, 2, 3, 3, 3, 1, 3, 3, 3, 2, 3, 3, 3, 3, 2, 2, 3, 2, 3, 3, 1, 0, 3, 3, 

4663it [00:00, 574982.79it/s]


[3, 3, 3, 0, 3, 2, 3, 3, 2, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 2, 2, 0, 3, 3, 2, 3, 2, 2, 0, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 0, 2, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 1, 2, 3, 3, 3, 3, 3, 0, 2, 3, 3, 3, 0, 3, 0, 3, 2, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 2, 2, 2, 3, 3, 2, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 3, 3, 3, 2, 2, 3, 2, 3, 3, 3, 2, 3, 2, 3, 3, 2, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 0, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 0, 3, 0, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 0, 3, 3, 0, 2, 3, 3, 3, 3, 2, 3, 

3783it [00:00, 851693.61it/s]


[3, 3, 0, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 2, 3, 2, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 2, 3, 3, 2, 3, 3, 3, 3, 2, 1, 2, 3, 3, 2, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 0, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 2, 3, 3, 2, 3, 3, 3, 3, 2, 3, 0, 0, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 2, 3, 3, 3, 0, 2, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 2, 3, 3, 3, 0, 3, 3, 2, 3, 0, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 2, 3, 2, 2, 3, 3, 3, 0, 3, 2, 3, 0, 0, 3, 3, 2, 0, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 2, 2, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 3, 3, 3, 2, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 0, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 3, 3, 2, 3, 2, 2, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 0, 3, 3, 2, 2, 3, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 3, 2, 3, 3, 1, 3, 3, 3, 2, 

3388it [00:00, 826324.47it/s]


[1, 3, 2, 3, 3, 0, 0, 3, 3, 2, 3, 3, 2, 0, 3, 2, 2, 2, 2, 3, 2, 3, 3, 3, 0, 3, 2, 3, 3, 3, 3, 3, 3, 0, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 2, 2, 3, 2, 3, 3, 2, 3, 2, 3, 3, 3, 3, 0, 2, 3, 2, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 0, 3, 2, 2, 3, 3, 2, 0, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 0, 3, 3, 2, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 2, 1, 3, 2, 2, 3, 3, 2, 3, 2, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 2, 2, 0, 3, 3, 2, 3, 2, 2, 3, 3, 0, 2, 3, 3, 3, 2, 3, 2, 0, 3, 3, 3, 2, 3, 3, 0, 3, 2, 0, 3, 2, 2, 3, 3, 3, 3, 3, 0, 3, 2, 3, 0, 0, 0, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 0, 0, 2, 2, 3, 3, 0, 3, 3, 0, 3, 3, 2, 3, 3, 3, 3, 2, 3, 2, 3, 0, 3, 3, 0, 3, 3, 1, 0, 3, 3, 0, 2, 3, 0, 3, 3, 3, 2, 1, 3, 2, 3, 1, 0, 0, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 2, 3, 2, 2, 0, 2, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 2, 0, 3, 2, 1, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 2, 0, 3, 

3644it [00:00, 804127.10it/s]


[0, 3, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 0, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 2, 3, 0, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 2, 3, 3, 3, 2, 3, 3, 1, 3, 2, 3, 3, 2, 2, 3, 3, 1, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 1, 2, 3, 0, 3, 2, 3, 3, 3, 0, 3, 3, 3, 2, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 1, 3, 3, 3, 3, 2, 2, 3, 3, 2, 3, 0, 0, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 2, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 2, 3, 3, 3, 3, 0, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 0, 1, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 0, 0, 3, 2, 3, 3, 2, 3, 3, 3, 3, 2, 2, 3, 2, 3, 2, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 2, 3, 0, 0, 2, 3, 3, 3, 2, 3, 3, 2, 3, 3, 2, 3, 3, 3, 2, 2, 2, 3, 2, 2, 2, 3, 

4644it [00:00, 577427.08it/s]


[3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 2, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 1, 3, 3, 3, 3, 2, 3, 0, 3, 3, 2, 3, 0, 3, 3, 2, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 2, 1, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 1, 3, 3, 2, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 3, 3, 3, 0, 2, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 1, 3, 3, 1, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 0, 3, 1, 3, 2, 2, 2, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 2, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 2, 2, 3, 3, 0, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 

3848it [00:00, 795646.13it/s]


[2, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 2, 2, 3, 3, 2, 2, 3, 3, 0, 3, 3, 3, 3, 2, 3, 3, 3, 2, 0, 2, 3, 3, 3, 3, 3, 3, 3, 0, 0, 3, 2, 3, 0, 2, 3, 0, 0, 2, 3, 0, 3, 3, 3, 0, 2, 3, 2, 2, 3, 2, 0, 3, 3, 2, 3, 2, 3, 2, 3, 3, 3, 3, 2, 3, 3, 3, 0, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 0, 2, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 2, 0, 2, 2, 3, 3, 3, 3, 3, 3, 3, 0, 2, 3, 3, 3, 2, 3, 3, 3, 0, 3, 3, 3, 3, 3, 2, 3, 3, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 0, 2, 2, 3, 1, 3, 3, 2, 2, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 2, 0, 3, 2, 3, 3, 3, 3, 2, 3, 3, 2, 3, 2, 0, 2, 3, 0, 3, 3, 3, 2, 3, 2, 2, 2, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 2, 2, 3, 2, 3, 3, 3, 0, 3, 1, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 2, 0, 3, 2, 3, 1, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 3, 3, 3, 2, 2, 2, 3, 3, 3, 0, 3, 3, 

4273it [00:00, 856295.32it/s]


[2, 0, 2, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 1, 3, 3, 0, 0, 2, 3, 3, 2, 2, 3, 3, 3, 3, 3, 0, 2, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 1, 3, 2, 3, 3, 0, 2, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 0, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 2, 2, 3, 1, 3, 2, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 1, 3, 3, 2, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 3, 2, 3, 3, 3, 3, 0, 2, 1, 3, 3, 3, 2, 3, 3, 2, 0, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 2, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 0, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 

4039it [00:00, 817487.52it/s]


[2, 3, 3, 1, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 2, 3, 0, 3, 3, 0, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 2, 2, 3, 2, 3, 3, 0, 3, 0, 0, 3, 3, 2, 3, 3, 3, 3, 2, 0, 3, 3, 0, 3, 3, 2, 3, 3, 2, 0, 2, 3, 3, 3, 3, 2, 0, 3, 0, 3, 3, 3, 3, 1, 3, 1, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 1, 3, 0, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 0, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 2, 0, 2, 2, 3, 3, 3, 3, 1, 3, 0, 3, 3, 3, 3, 3, 2, 2, 0, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 0, 3, 0, 3, 3, 3, 2, 3, 3, 3, 3, 3, 0, 0, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 1, 3, 2, 3, 3, 3, 2, 2, 0, 3, 3, 3, 2, 3, 3, 0, 2, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 2, 2, 3, 0, 3, 2, 2, 3, 3, 3, 3, 2, 2, 2, 2, 0, 3, 2, 3, 1, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 

3944it [00:00, 854238.83it/s]


[1, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 1, 3, 3, 3, 2, 3, 3, 2, 2, 2, 2, 2, 3, 2, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 0, 3, 2, 3, 2, 3, 2, 3, 2, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 2, 2, 2, 3, 0, 3, 0, 3, 3, 3, 3, 3, 3, 3, 0, 3, 2, 3, 3, 0, 2, 3, 3, 3, 2, 3, 2, 3, 2, 0, 3, 3, 3, 3, 3, 3, 0, 0, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 0, 0, 3, 3, 0, 3, 3, 0, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 0, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 2, 3, 0, 3, 3, 3, 2, 3, 2, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 0, 2, 3, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, 2, 3, 0, 3, 3, 3, 3, 2, 2, 0, 0, 3, 3, 2, 3, 3, 0, 3, 3, 3, 2, 3, 3, 3, 0, 3, 3, 3, 3, 2, 3, 3, 3, 3, 3, 3, 0, 3, 3, 2, 3, 3, 3, 3, 3, 3, 2, 2, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 2, 3, 3, 3, 0, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 3, 1, 3, 3, 3, 3, 3, 2, 3, 3, 3, 3, 2, 3, 3, 2, 3, 

In [None]:
import sys
import numpy as np

from sklearn.ensemble import AdaBoostClassifier
import pandas as pd
from datasets import Dataset, DatasetDict

#check_version()
#parse_params()

# Load the training dataset and generate folds
d = DataReaderFromPath()

# Per-fold inputs (Xs) and integer labels (ys), keyed by fold index.
Xs = {}
ys = {}
# folds: 10 lists of training body ids; hold_out: body ids reserved for the hold-out set.
folds, hold_out = kfold_split(d, n_folds=10)
fold_stances, hold_out_stances = get_stances_for_folds(d, folds, hold_out)
# Build the combined headline/summary texts and labels for the hold-out set and every fold
X_holdout, y_holdout = generate_labeled_data(hold_out_stances, d, "holdout")
for fold in fold_stances:
    Xs[fold], ys[fold] = generate_labeled_data(fold_stances[fold], d, str(fold))


# Load the competition dataset (reads competition_test_stances_unlabeled.csv and competition_test_summaries.csv)
unlabeled_competition_dataset = DataReaderFromPath(name="competition_test", is_unlabeled=True)

<__main__.DataReaderFromPath at 0x7fec2dd7d490>

In [None]:
# Display the reader object to confirm the competition data was loaded.
unlabeled_competition_dataset

25413it [00:00, 845790.07it/s]


In [None]:
# Combined headline/summary texts for the competition stances (no labels available).
X_unlabeled = generate_data_without_labels(unlabeled_competition_dataset.stances, unlabeled_competition_dataset,"competition_unlabeled")

25413

In [None]:
# Number of competition examples.
len(X_unlabeled)

In [None]:
def get_X_data_in_batches(X_data, batch_size=200):
  """Split ``X_data`` into consecutive lists of at most ``batch_size`` items.

  Args:
    X_data: Iterable of examples.
    batch_size: Maximum number of items per batch (default 200, the value
      that used to be hard-coded).

  Returns:
    A list of lists; every batch is full except possibly the last one. Empty
    input yields an empty list.

  Raises:
    ValueError: If ``batch_size`` is not positive.
  """
  if batch_size <= 0:
    raise ValueError("batch_size must be a positive integer")

  items = list(X_data)
  # The per-batch debug print of the first element was removed.
  return [items[start:start + batch_size] for start in range(0, len(items), batch_size)]

In [None]:
def get_XY_data_in_batches(X_data, y_data, batch_size=200):
  """Pair each example with its label and split the pairs into batches.

  Args:
    X_data: Iterable of examples.
    y_data: Indexable sequence of labels; ``y_data[i]`` belongs to the i-th
      example.
    batch_size: Maximum number of records per batch (default 200, the value
      that used to be hard-coded).

  Returns:
    A list of batches; each batch is a list of ``{"X": example, "y": label}``
    dicts. Empty input yields an empty list.

  Raises:
    ValueError: If ``batch_size`` is not positive.
  """
  if batch_size <= 0:
    raise ValueError("batch_size must be a positive integer")

  # Plain dicts replace DatasetDict here: the values are a single example and
  # its label rather than Dataset objects, and callers only read the "X" and
  # "y" keys.
  records = [{"X": xdata, "y": y_data[index]} for index, xdata in enumerate(X_data)]
  return [records[start:start + batch_size] for start in range(0, len(records), batch_size)]

Ferguson riots: Pregnant woman loses eye after cops fire BEAN BAG round through car window <TitleSummarySep> Helric Fredou, 45, turned a gun on himself in his police office in Limoges. A colleague found his body at 1am on Thursday, the day after three gunmen fired at the satirical magazine's office and left 12 people dead. Union of Commissioners of the National Police confirmed Mr Fredou took his own life.
Bear attack foiled by Justin Bieber’s music: A story too good to check <TitleSummarySep> President Cristina Fernandez de Kirchhner adopted Yair Tawil as her godson. Tradition says the seventh son in a family will turn into a werewolf and eat unbaptized babies. Yair is the first Jewish boy to be adopted, as the practice only applied to Catholics until 2009.
Finally, proof that Justin Bieber IS unbearable: Russian fisherman saved from bear attack when ringtone featuring one of the pop brat's songs scares it away <TitleSummarySep> A customer says he was able to change the quality of App

In [None]:
# Split the competition texts into batches.
competition_dataset_in_batches = get_X_data_in_batches(X_unlabeled)

DatasetDict({
    X: Police find mass graves with at least '15 bodies' near Mexico town where 43 students disappeared after police clash <TitleSummarySep> Seth Rogen is being eyed to play Apple co-founder Steve Wozniak in Sony’s Steve Jobs biopic. Danny Boyle is directing the untitled film, based on Walter Isaacson's book and adapted by Aaron Sorkin. Christian Bale, the actor who is to play Jobs, is still in the midst of closing his deal.
    y: 3
})
DatasetDict({
    X: Predator Drone Reportedly Spotted Over ISIS Hotbed in Syria; Airstrikes Hit ISIS Targets <TitleSummarySep> U.S. drones are hunting for al-Baghdadi, according to reports in the Telegraph. Reports say the U.S.-led coalition is using drones to hunt for the ISIS leader. The Telegraph reports that the drones are believed to be armed with machine guns and drones.
    y: 2
})
DatasetDict({
    X: One of 'Taliban Five' in Bowe Bergdahl swap allegedly returned to militancy <TitleSummarySep> The lethal animals are being launched

In [None]:
# Split the hold-out texts and their labels into batches of X/y records.
holdout_dataset_in_batches = get_XY_data_in_batches(X_holdout,y_holdout)

In [None]:
# Wrap every competition batch in a DatasetDict with a single "competition" split.
competition_data_dict_list = []
for batch in competition_dataset_in_batches:
    # The competition data has no gold labels, so every row gets the placeholder
    # label 3 (the index of 'unrelated' in LABELS).
    data_dict =DatasetDict(
      competition=Dataset.from_dict(
          {
              "text": batch,
              "label": [3]*len(batch),
          }
      )
    )
    competition_data_dict_list.append(data_dict)

In [None]:
# Wrap every hold-out batch in a DatasetDict with a single "holdout" split.
holdout_data_dict_list = []
for batch in holdout_dataset_in_batches:
  #print(batch)
  # Unzip the batch's X/y records into parallel text and label columns.
  X_values = []
  y_values = []
  for dict_val in batch:
    X_values.append(dict_val["X"])
    y_values.append(dict_val["y"])
  data_dict =DatasetDict(
    holdout=Dataset.from_dict(
        {
            "text": X_values,
            "label": y_values,
        }
    )
  )
  holdout_data_dict_list.append(data_dict)

'Bear attack foiled by Justin Bieber’s music: A story too good to check <TitleSummarySep> President Cristina Fernandez de Kirchhner adopted Yair Tawil as her godson. Tradition says the seventh son in a family will turn into a werewolf and eat unbaptized babies. Yair is the first Jewish boy to be adopted, as the practice only applied to Catholics until 2009.'

In [None]:
# Spot check: first text of the second competition batch.
competition_data_dict_list[1]['competition']['text'][0]

'Predator Drone Reportedly Spotted Over ISIS Hotbed in Syria; Airstrikes Hit ISIS Targets <TitleSummarySep> U.S. drones are hunting for al-Baghdadi, according to reports in the Telegraph. Reports say the U.S.-led coalition is using drones to hunt for the ISIS leader. The Telegraph reports that the drones are believed to be armed with machine guns and drones.'

In [None]:
# Spot check: first text of the second hold-out batch.
holdout_data_dict_list[1]['holdout']['text'][0]

Downloading tokenizer_config.json:   0%|          | 0.00/28.0 [00:00<?, ?B/s]

Downloading config.json:   0%|          | 0.00/483 [00:00<?, ?B/s]

Downloading vocab.txt:   0%|          | 0.00/226k [00:00<?, ?B/s]

Downloading tokenizer.json:   0%|          | 0.00/455k [00:00<?, ?B/s]

1

In [None]:
import os, numpy as np

from transformers import (
    AutoTokenizer,
    AutoModelForSequenceClassification,
    TrainingArguments,
    Trainer,
)

#adapted from https://github.com/Demfier/pytorch-tutorials/blob/main/bert_classifier/train.py
# Load the DistilBERT tokenizer (fast implementation).
tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased", use_fast=True)
# Register the headline/summary separator (the marker combine_headline_and_bodies inserts) as a token.
# NOTE(review): a model used with this tokenizer presumably needs its embeddings resized
# (resize_token_embeddings) to cover the added token - confirm where the model is created.
new_token = "<TitleSummarySep>"
tokenizer.add_tokens(new_token)



In [None]:
def preprocess(example):
  """Tokenize ``example["text"]``, truncating and padding to 200 tokens."""
  return tokenizer(
      example["text"],
      max_length=200,
      truncation=True,
      padding='max_length',
  )

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

In [None]:
# Apply `preprocess` to every entry of `competition_data_dict_list` via its
# `.map(..., batched=True)` method, keeping the results in the same order.
# NOTE(review): entries are presumably Hugging Face `datasets` objects — confirm.
encoded_competitiondataset_list = [
    dataset.map(preprocess, batched=True)
    for dataset in competition_data_dict_list
]

Downloading pytorch_model.bin:   0%|          | 0.00/256M [00:00<?, ?B/s]

Some weights of the model checkpoint at distilbert-base-uncased were not used when initializing DistilBertForSequenceClassification: ['vocab_transform.bias', 'vocab_projector.bias', 'vocab_transform.weight', 'vocab_layer_norm.weight', 'vocab_layer_norm.bias', 'vocab_projector.weight']
- This IS expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DistilBertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.weight', 'pre_classifier.weight', 'pre_clas

The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36226
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,1.235146,0.770611,0.192653,0.25,0.217612
2,No log,0.821368,0.770611,0.192653,0.25,0.217612
3,No log,0.610916,0.770611,0.192653,0.25,0.217612
4,No log,0.368666,0.863482,0.36367,0.471763,0.401484
5,No log,0.302182,0.878274,0.588563,0.50637,0.456108
6,No log,0.292716,0.901552,0.591114,0.570793,0.553389
7,No log,0.273503,0.908341,0.600753,0.583006,0.570441
8,No log,0.288601,0.904704,0.598259,0.570573,0.558115
9,No log,0.265292,0.910281,0.582813,0.607121,0.586979
10,No log,0.268641,0.910524,0.580099,0.601251,0.584179


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4124
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4

Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543
Score for fold 6 was - 0.8760413674231543


  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568


The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 35687
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1750


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.014261,0.995068,0.93111,0.950545,0.940031
2,No log,0.014807,0.995282,0.931669,0.959198,0.943856
3,No log,0.015757,0.994639,0.925584,0.957564,0.939405
4,No log,0.016427,0.994853,0.935861,0.955097,0.944664
5,No log,0.016669,0.993781,0.924469,0.947255,0.934595
6,No log,0.016912,0.993352,0.929116,0.921612,0.925294
7,No log,0.017021,0.99421,0.926946,0.960159,0.940978
8,No log,0.016403,0.992923,0.914109,0.941835,0.926245
9,No log,0.016806,0.993352,0.927536,0.933254,0.930369
10,No log,0.017686,0.992923,0.910207,0.948065,0.92568


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4663
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-35
Configuration saved in checkpoints/checkpoint-35/config.json
Model weights saved in checkpoints/checkpoint-35/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-35/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-35/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4

Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267
Score for fold 0 was - 0.991909781809267


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36567
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.023197,0.992863,0.938306,0.941387,0.939796
2,No log,0.024089,0.992863,0.941657,0.946429,0.943812
3,No log,0.029509,0.990219,0.931338,0.935924,0.932526
4,No log,0.02801,0.990748,0.929096,0.938025,0.932455
5,No log,0.025087,0.99207,0.928595,0.953361,0.938436
6,No log,0.027891,0.989955,0.918686,0.932031,0.924312
7,No log,0.023814,0.99207,0.933863,0.942223,0.937762
8,No log,0.039773,0.986783,0.924743,0.890229,0.906144
9,No log,0.027096,0.989955,0.926041,0.915118,0.920148
10,No log,0.027262,0.990748,0.928763,0.929407,0.929007


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3783
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3

Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024
Score for fold 7 was - 0.9885447602885024


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]



  0%|          | 0/4 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594


  0%|          | 0/4 [00:00<?, ?ba/s]

Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594




  0%|          | 0/4 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594


The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36962
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1850


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.028312,0.990555,0.941705,0.910038,0.924082
2,No log,0.027133,0.99026,0.956253,0.893425,0.91689
3,No log,0.029337,0.988784,0.938479,0.882589,0.903986
4,No log,0.027429,0.99026,0.935566,0.912518,0.923149
5,No log,0.030953,0.989669,0.941375,0.897941,0.916182
6,No log,0.027126,0.988784,0.928804,0.8891,0.905637
7,No log,0.035807,0.987898,0.914843,0.916074,0.915207
8,No log,0.028516,0.989965,0.932853,0.914997,0.923432
9,No log,0.035469,0.989079,0.944741,0.883365,0.906615
10,No log,0.028875,0.988784,0.922479,0.898868,0.909594


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3388
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-37
Configuration saved in checkpoints/checkpoint-37/config.json
Model weights saved in checkpoints/checkpoint-37/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-37/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-37/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3

Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404
Score for fold 5 was - 0.9888070692194404


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832


The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36706
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.003004,0.999177,0.986607,0.996739,0.991478
2,No log,0.003392,0.999177,0.986607,0.996739,0.991478
3,No log,0.003407,0.999177,0.986607,0.996739,0.991478
4,No log,0.003291,0.998902,0.982456,0.996425,0.989111
5,No log,0.005717,0.99753,0.96371,0.990217,0.975446
6,No log,0.003731,0.998628,0.983937,0.988078,0.985987
7,No log,0.003372,0.998628,0.987138,0.983675,0.985384
8,No log,0.005514,0.998079,0.976645,0.988761,0.98236
9,No log,0.004905,0.998079,0.978221,0.982274,0.980227
10,No log,0.005403,0.997805,0.971482,0.984817,0.977832


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3644
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3

Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191
Score for fold 2 was - 0.9986914800814191


  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/36 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833


The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 35706
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1750


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.006682,0.997416,0.982936,0.974046,0.978264
2,No log,0.00867,0.996124,0.962789,0.977796,0.969502
3,No log,0.00731,0.997631,0.982147,0.978828,0.980451
4,No log,0.014008,0.995047,0.960201,0.974878,0.966268
5,No log,0.014059,0.995047,0.977165,0.941423,0.955665
6,No log,0.00995,0.99677,0.985508,0.967215,0.975408
7,No log,0.010003,0.996555,0.969709,0.977428,0.973444
8,No log,0.011015,0.995263,0.953757,0.972026,0.961628
9,No log,0.011144,0.995693,0.958414,0.977384,0.966841
10,No log,0.012136,0.995047,0.95415,0.964051,0.958833


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4644
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-35
Configuration saved in checkpoints/checkpoint-35/config.json
Model weights saved in checkpoints/checkpoint-35/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-35/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-35/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4

Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921
Score for fold 8 was - 0.9960634920634921


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36502
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3848
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3

Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.002948,0.99922,0.991667,0.997533,0.994523
2,No log,0.003114,0.99896,0.992608,0.992608,0.992608
3,No log,0.003005,0.998701,0.991727,0.989735,0.990722
4,No log,0.004157,0.998441,0.98901,0.991436,0.990215
5,No log,0.004572,0.997921,0.98185,0.989319,0.985453
6,No log,0.006697,0.997401,0.987302,0.98152,0.984374
7,No log,0.004359,0.998181,0.985078,0.992192,0.988496
8,No log,0.00687,0.997401,0.992439,0.973316,0.98213
9,No log,0.005814,0.998181,0.985078,0.992192,0.988496
10,No log,0.006373,0.997401,0.984374,0.98152,0.982938


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3848
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-1224
Configuration saved in checkpoints/checkpoint-1224/config.json
Model weights saved in checkpoints/checkpoint-1224/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-1224/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-1224/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num ex

Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741
Score for fold 9 was - 0.998744069215741


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]



Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013


The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36077
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.004072,0.998596,0.991797,0.982383,0.986896
2,No log,0.005288,0.997192,0.970823,0.979062,0.974772
3,No log,0.006032,0.998128,0.98734,0.978099,0.982528
4,No log,0.007043,0.997192,0.983312,0.964766,0.973255
5,No log,0.006673,0.998128,0.98734,0.978099,0.982528
6,No log,0.009909,0.997192,0.983312,0.964766,0.973255
7,No log,0.010953,0.997192,0.986081,0.962383,0.972974
8,No log,0.012256,0.997426,0.989964,0.963333,0.975095
9,No log,0.010795,0.996256,0.959934,0.97526,0.966962
10,No log,0.009546,0.996724,0.970013,0.970013,0.970013


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4273
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4

Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803
Score for fold 3 was - 0.9975711779786803


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

  0%|          | 0/5 [00:00<?, ?ba/s]

The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36311
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.005437,0.998762,0.990593,0.989601,0.990093
2,No log,0.006085,0.998267,0.986499,0.987877,0.98716
3,No log,0.009009,0.997772,0.98304,0.986153,0.9845
4,No log,0.006827,0.997772,0.989861,0.970932,0.979818
5,No log,0.007024,0.997524,0.985209,0.97007,0.977244
6,No log,0.007842,0.997524,0.988493,0.967026,0.976957
7,No log,0.007784,0.998514,0.986864,0.988739,0.98778
8,No log,0.008783,0.997772,0.982519,0.986153,0.98425
9,No log,0.012514,0.996781,0.977925,0.982705,0.980109
10,No log,0.007756,0.997772,0.978591,0.983606,0.981036


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4039
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 4

Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226
Score for fold 1 was - 0.997904735298226


  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

  0%|          | 0/4 [00:00<?, ?ba/s]

The following columns in the training set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running training *****
  Num examples = 36406
  Num Epochs = 50
  Instantaneous batch size per device = 128
  Total train batch size (w. parallel, distributed & accumulation) = 1024
  Gradient Accumulation steps = 1
  Total optimization steps = 1800


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526




Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526


Epoch,Training Loss,Validation Loss,Accuracy,Precision,Recall,F1
1,No log,0.00282,0.998732,0.972826,0.996082,0.983657
2,No log,0.003059,0.998732,0.972826,0.996082,0.983657
3,No log,0.004273,0.998479,0.968085,0.995298,0.980581
4,No log,0.00326,0.998732,0.972826,0.996082,0.983657
5,No log,0.0034,0.998732,0.972826,0.996082,0.983657
6,No log,0.006778,0.996957,0.943396,0.990596,0.963293
7,No log,0.005825,0.998225,0.967704,0.994514,0.97999
8,No log,0.003105,0.998986,0.977778,0.996865,0.986795
9,No log,0.004022,0.998225,0.971461,0.9892,0.979804
10,No log,0.003358,0.998732,0.976892,0.990768,0.983526


The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3944
  Batch size = 128
Saving model checkpoint to checkpoints/checkpoint-36
Configuration saved in checkpoints/checkpoint-36/config.json
Model weights saved in checkpoints/checkpoint-36/pytorch_model.bin
tokenizer config file saved in checkpoints/checkpoint-36/tokenizer_config.json
Special tokens file saved in checkpoints/checkpoint-36/special_tokens_map.json
The following columns in the evaluation set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Evaluation *****
  Num examples = 3

Score for fold 4 was - 0.9991415080841322
Score for fold 4 was - 0.9991415080841322
Score for fold 4 was - 0.9991415080841322
Score for fold 4 was - 0.9991415080841322
Score for fold 4 was - 0.9991415080841322
Score for fold 4 was - 0.9991415080841322


Saving model checkpoint to nli_model/


Score for fold 4 was - 0.9991415080841322
Score for fold 4 was - 0.9991415080841322


Configuration saved in nli_model/config.json
Model weights saved in nli_model/pytorch_model.bin
tokenizer config file saved in nli_model/tokenizer_config.json
Special tokens file saved in nli_model/special_tokens_map.json


<transformers.trainer.Trainer object at 0x7feae52c5b90>
<transformers.trainer.Trainer object at 0x7feada346610>
<transformers.trainer.Trainer object at 0x7feadcf50710>
<transformers.trainer.Trainer object at 0x7feab4129510>
<transformers.trainer.Trainer object at 0x7feab46e6ed0>


tokenizer config file saved in nli_model/tokenizer_config.json
Special tokens file saved in nli_model/special_tokens_map.json


<transformers.trainer.Trainer object at 0x7feab3feef50>
<transformers.trainer.Trainer object at 0x7feab40707d0>
<transformers.trainer.Trainer object at 0x7feadcf96f50>


  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

  0%|          | 0/1 [00:00<?, ?ba/s]

The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


  0%|          | 0/1 [00:00<?, ?ba/s]

The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 22
  Batch size = 128


Scores on the dev set
Scores on the dev set
Scores on the dev set
Scores on the dev set
Scores on the dev set
Scores on the dev set
Scores on the dev set
Scores on the dev set
-------------------------------------------------------------
|           |   agree   | disagree  |  discuss  | unrelated |
-------------------------------------------------------------
|   agree   |    421    |    35     |    272    |    34     |
-------------------------------------------------------------
| disagree  |    36     |    62     |    58     |     6     |
-------------------------------------------------------------
|  discuss  |    142    |    59     |   1536    |    63     |
-------------------------------------------------------------
| unrelated |    12     |     4     |    42     |   6840    |
--------------------------------------------------------------------------------------------------------------------------
|           |   agree   | disagree  |  discuss  | unrelated |
-------------------

The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.






***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 200
  Batch size = 128


The following columns in the test set don't have a corresponding argument in `DistilBertForSequenceClassification.forward` and have been ignored: text. If text are not expected by `DistilBertForSequenceClassification.forward`,  you can safely ignore this message.
***** Running Prediction *****
  Num examples = 13
  Batch size = 128


In [None]:
import itertools
import torch_xla.distributed.xla_multiprocessing as xmp
from pathlib import Path


# Load the pretrained DistilBERT checkpoint with a 4-label sequence
# classification head on top.
backbone_checkpoint = "distilbert-base-uncased"
backbone = AutoModelForSequenceClassification.from_pretrained(
    backbone_checkpoint,
    num_labels=4,
)

# Resize the token-embedding matrix to len(tokenizer) so it matches the
# tokenizer in use (presumably extended with extra tokens earlier in the
# notebook -- confirm against the tokenizer setup cell).
tokenizer_vocab_size = len(tokenizer)
backbone.resize_token_embeddings(tokenizer_vocab_size)

# Wrap the model with torch_xla's MpModelWrapper; train_fnc later moves the
# wrapped model onto its device via `.to(device)`.
WRAPPED_MODEL = xmp.MpModelWrapper(backbone)

def train_fnc(WRAPPED_MODEL, device):
  """Cross-validate the stance classifier, score it on the holdout set and write `answer.csv`.

  If the `nli_model/` directory does not exist, one training run is performed
  per entry of `fold_stances`: the fold is held out for evaluation and the
  remaining folds are used for training. Every fold starts from the same
  initial weights, and the weights of the fold with the highest relative
  `score_submission` score are saved to `nli_model/` together with the
  tokenizer. If the directory already exists, the saved model is loaded instead.

  The selected model is then evaluated on every dataset in
  `holdout_data_dict_list` (reported through `report_score`) and used to label
  every dataset in `encoded_competitiondataset_list`; those labels are written
  to `answer.csv` alongside the headline and body id of the matching entry in
  `unlabeled_competition_dataset.stances`.

  Relies on notebook-level names defined in other cells: `fold_stances`,
  `folds`, `Xs`, `ys`, `preprocess`, `tokenizer`, `compute_metrics`, `LABELS`,
  `score_submission`, `report_score`, `holdout_data_dict_list`,
  `encoded_competitiondataset_list` and `unlabeled_competition_dataset`.

  Args:
    WRAPPED_MODEL: wrapper exposing `.to(device)`, which yields the model to train.
    device: device the model is moved to.

  Returns:
    The `Trainer` holding the selected (best or loaded) model.

  Raises:
    RuntimeError: if training is required but `fold_stances` has no folds.
  """
  model = WRAPPED_MODEL.to(device)
  batch_size = 128

  # https://huggingface.co/docs/transformers/v4.20.1/en/main_classes/trainer#transformers.TrainingArguments
  training_args = TrainingArguments(
      "checkpoints",
      evaluation_strategy="epoch",
      save_strategy="epoch",
      learning_rate=1e-5,
      warmup_ratio=0.1,
      weight_decay=0.01,
      load_best_model_at_end=True,
      num_train_epochs=50,
      metric_for_best_model="accuracy",
      per_device_eval_batch_size=batch_size,
      per_device_train_batch_size=batch_size,
      tpu_num_cores=8,
  )

  best_fold = None

  directory_path = Path("nli_model/")
  if not directory_path.exists():
    # All fold trainers share the single `model` object, so keep CPU copies of
    # the weights: one of the untouched starting point (restored before each
    # fold, so no fold benefits from data seen by an earlier one) and one of
    # the best fold seen so far (restored before saving).
    initial_state = {
        name: tensor.detach().cpu().clone()
        for name, tensor in model.state_dict().items()
    }
    best_state = None
    best_score = 0

    # Classifier for each fold
    for fold in fold_stances:
      model.load_state_dict(initial_state)

      # The training set consists of every fold except the held-out one.
      train_ids = [i for i in range(len(folds)) if i != fold]
      X_train = list(itertools.chain.from_iterable(Xs[i] for i in train_ids))
      y_train = list(itertools.chain.from_iterable(ys[i] for i in train_ids))

      data_dict = DatasetDict(
          train=Dataset.from_dict({"text": X_train, "label": y_train}),
          test=Dataset.from_dict({"text": Xs[fold], "label": ys[fold]}),
      )
      encoded_dataset = data_dict.map(preprocess, batched=True)

      trainer = Trainer(
          model,
          training_args,
          train_dataset=encoded_dataset["train"],
          eval_dataset=encoded_dataset["test"],
          tokenizer=tokenizer,
          compute_metrics=compute_metrics,
      )
      trainer.place_model_on_device = False
      trainer.train()

      predicted, _, _ = trainer.predict(encoded_dataset["test"])
      labeled_predictions = [LABELS[int(a)] for a in np.argmax(predicted, axis=-1)]
      actual = [LABELS[int(a)] for a in encoded_dataset["test"]["label"]]

      # Normalise by the score a perfect submission would get on this fold.
      fold_score, _ = score_submission(actual, labeled_predictions)
      max_fold_score, _ = score_submission(actual, actual)
      score = fold_score / max_fold_score

      print("Score for fold " + str(fold) + " was - " + str(score))
      # The first fold always becomes the incumbent, even with a score of 0.
      if best_fold is None or score > best_score:
        best_score = score
        best_fold = trainer
        best_state = {
            name: tensor.detach().cpu().clone()
            for name, tensor in model.state_dict().items()
        }

    if best_fold is None:
      raise RuntimeError("No folds were available to train on; `fold_stances` is empty.")

    # Saving the best fold model: put its weights back into the shared model first.
    model.load_state_dict(best_state)
    best_fold.save_model("nli_model/")
    tokenizer.save_pretrained("nli_model/")

  else:
    print("Loading model")
    loaded_model = AutoModelForSequenceClassification.from_pretrained("./nli_model/").to(device)
    # Wrap the loaded model in a prediction-only Trainer so that the code below
    # can call `.predict(...)` regardless of which branch produced `best_fold`.
    inference_args = TrainingArguments(
        "checkpoints",
        per_device_eval_batch_size=batch_size,
        tpu_num_cores=8,
    )
    best_fold = Trainer(
        loaded_model,
        inference_args,
        tokenizer=tokenizer,
        compute_metrics=compute_metrics,
    )

  print(best_fold)

  encoded_holdout_dataset_list = [
      holdout_dict.map(preprocess, batched=True)
      for holdout_dict in holdout_data_dict_list
  ]

  holdout_predicted_labels = []
  holdout_actual_labels = []
  for encoded_holdout_dataset in encoded_holdout_dataset_list:
    prediction, _, _ = best_fold.predict(encoded_holdout_dataset["holdout"])
    holdout_predicted_labels.extend(
        LABELS[int(a)] for a in np.argmax(prediction, axis=-1)
    )
    holdout_actual_labels.extend(
        LABELS[int(a)] for a in encoded_holdout_dataset["holdout"]["label"]
    )

  print("Scores on the dev set")
  report_score(holdout_actual_labels, holdout_predicted_labels)
  print("")
  print("")

  result = []
  # Running position in the competition stances; predictions arrive in chunks
  # but are consumed in the same order as the stances.
  stance_index = 0
  for encoded_competition_dataset in encoded_competitiondataset_list:
    predictions, _, _ = best_fold.predict(encoded_competition_dataset["competition"])
    competition_labels = [LABELS[int(a)] for a in np.argmax(predictions, axis=-1)]

    for predicted_label in competition_labels:
      stance = unlabeled_competition_dataset.stances[stance_index]
      result.append({
          "Headline": stance['Headline'],
          "Body ID": stance['Body ID'],
          "Stance": predicted_label,
      })
      stance_index += 1

  test_data = pd.DataFrame(result)
  test_data.to_csv('answer.csv', index=False, encoding='utf-8')  # From pandas library

  return best_fold


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>