In [1]:
import numpy as np
import pickle
import os

# NOTE(review): `seed` is not referenced by any later cell visible here; the
# fine-tuning runs take their seeds from the `seeds` list instead. Confirm
# whether this value is still needed.
seed = 2023

In [2]:
import torch

# Run on the GPU when torch can see one; otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"
device

'cuda'

In [3]:
import transformers

# Only report critical errors to avoid excessive logging during fine-tuning.
# CRITICAL is the named constant for logging level 50, so the verbosity is the
# same as before; it just no longer relies on a magic number.
transformers.utils.logging.set_verbosity(transformers.utils.logging.CRITICAL)

In [4]:
from nlpsig_networks.scripts.fine_tune_bert_classification import (
    fine_tune_transformer_average_seed,
)

In [5]:
# Directory that receives the results CSVs written by the fine-tuning runs.
output_dir = "rumours_output"
# exist_ok=True makes the cell idempotent on re-run and avoids the
# check-then-create race of a separate os.path.isdir() test.
os.makedirs(output_dir, exist_ok=True)

## Rumours

In [6]:
# Execute the loading script; %run makes the script's top-level names available
# in this notebook's namespace once it finishes.
# NOTE(review): df_rumours, label_to_id, id_to_label, output_dim and split_ids
# are used by later cells but are not defined in any visible cell, so they
# presumably come from this script. Confirm.
%run load_sbert-embeddings.py

In [7]:
# Preview the first rows of the rumours dataframe; its `text` and `label`
# columns are the ones passed to the fine-tuning call below.
df_rumours.head()

Unnamed: 0,id,label,datetime,text,timeline_id,set
0,5.249902e+17,0,2014-10-22 18:26:23,Police have clarified that there were two shoo...,0,train
1,5.249906e+17,0,2014-10-22 18:27:58,"@CTVNews you guys ""confirmed"" there were 3 sho...",0,train
2,5.249908e+17,1,2014-10-22 18:28:46,@CTVNews get it right. http://t.co/GHYxMuzPG9,0,train
3,5.249927e+17,1,2014-10-22 18:36:29,RT @CTVNews Police have clarified that there w...,0,train
4,5.250038e+17,1,2014-10-22 19:20:41,@CTVNews @ctvsaskatoon so what happened at Rid...,0,train


## Baseline: Fine-tune BERT for classification

In [8]:
# Settings shared by every fine-tuning run in this notebook.
# Number of training epochs per run.
num_epochs = 5
# Candidate learning rates handed to the fine-tuning function.
learning_rates = [5e-5, 1e-5, 1e-6]
# Random seeds for the repeated runs (the results frame has one row per seed).
seeds = [1, 12, 123]
# Passed as `validation_metric`; presumably the validation score used to choose
# among `learning_rates`. Confirm in fine_tune_transformer_average_seed.
validation_metric = "f1"

In [9]:
# Show the label -> class-id mapping passed to the fine-tuning call as `label_to_id`.
label_to_id

{'0': 0, '1': 1}

In [10]:
# Show the class-id -> label mapping passed to the fine-tuning call as `id_to_label`.
id_to_label

{0: '0', 1: '1'}

In [11]:
# Keyword arguments common to every fine_tune_transformer_average_seed call in
# this notebook. The loss-specific arguments (loss, gamma, results_output) are
# supplied separately at each call site.
kwargs = dict(
    num_epochs=num_epochs,
    pretrained_model_name="bert-base-uncased",
    df=df_rumours,
    feature_name="text",
    label_column="label",
    label_to_id=label_to_id,
    id_to_label=id_to_label,
    output_dim=output_dim,
    learning_rates=learning_rates,
    seeds=seeds,
    device=device,
    batch_size=8,
    split_ids=split_ids,
    k_fold=True,
    validation_metric=validation_metric,
    verbose=False,
)

## Focal Loss

In [12]:
# Loss settings for the first experiment: focal loss with gamma = 2.
loss, gamma = "focal", 2

In [13]:
# Fine-tune BERT using the current `loss`/`gamma` settings plus the shared
# `kwargs`. `results_output` is the CSV path the results dataframe is saved to
# (see the "saving the results dataframe to CSV" line in the run log).
# Long-running cell: the log shows many consecutive 5-epoch training runs.
bert_classifier = fine_tune_transformer_average_seed(
    loss=loss,
    gamma=gamma,
    results_output=f"{output_dir}/bert_classifier_focal.csv",
    **kwargs,
)

  0%|          | 0/3 [00:00<?, ?it/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.175128,0.78135,0.769612
2,0.215100,0.229847,0.801929,0.782294
3,0.130100,0.26366,0.787781,0.763419
4,0.062600,0.437864,0.789068,0.772723
5,0.062600,0.576602,0.786495,0.768369


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.180301,0.790953,0.768101
2,0.211600,0.162821,0.768334,0.763853
3,0.132200,0.206907,0.806717,0.79541
4,0.132200,0.341469,0.795751,0.780634
5,0.070500,0.425662,0.809459,0.796885


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.24009,0.648241,0.393293
2,0.214200,0.260987,0.777459,0.747333
3,0.152300,0.22076,0.781048,0.755537
4,0.152300,0.336756,0.767408,0.746393
5,0.088400,0.407268,0.769562,0.745787


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.192495,0.772575,0.746799
2,0.212900,0.17527,0.808696,0.800158
3,0.130800,0.198096,0.799331,0.793606
4,0.072800,0.289047,0.805351,0.789521
5,0.072800,0.455159,0.8,0.786648


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.208769,0.75412,0.725217
2,0.216200,0.186639,0.782465,0.776928
3,0.134100,0.335128,0.777851,0.757038
4,0.068000,0.37907,0.787739,0.777919
5,0.068000,0.526244,0.777851,0.764904


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.173963,0.805145,0.789334
2,0.204900,0.172301,0.814148,0.804817
3,0.127600,0.246576,0.821222,0.803831
4,0.075500,0.311917,0.813505,0.80146
5,0.075500,0.427955,0.810289,0.796264


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.276985,0.770391,0.731051
2,0.212500,0.203743,0.801234,0.784101
3,0.138400,0.246892,0.801919,0.789078
4,0.138400,0.473059,0.795751,0.778145
5,0.064600,0.562765,0.797121,0.77831


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.194702,0.750179,0.703843
2,0.212900,0.212851,0.772434,0.752645
3,0.149500,0.255148,0.748026,0.740709
4,0.149500,0.252674,0.776023,0.761387
5,0.093000,0.331272,0.778177,0.757138


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.19004,0.755853,0.708604
2,0.221300,0.202323,0.807358,0.798527
3,0.140800,0.190588,0.807358,0.795708
4,0.059900,0.416343,0.795987,0.781253
5,0.059900,0.509129,0.799331,0.783941


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.201363,0.760053,0.742978
2,0.211700,0.190972,0.77851,0.775523
3,0.117600,0.310327,0.768622,0.756079
4,0.036600,0.547778,0.7706,0.756829
5,0.036600,0.714912,0.773896,0.76364


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.228716,0.783923,0.76521
2,0.219800,0.171287,0.817363,0.802469
3,0.136100,0.186493,0.803215,0.793517
4,0.073000,0.388246,0.797428,0.780485
5,0.073000,0.565887,0.79164,0.772317


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.232894,0.690199,0.593713
2,0.240000,0.172886,0.784099,0.778298
3,0.162300,0.26637,0.797121,0.773742
4,0.162300,0.296031,0.799178,0.786004
5,0.084000,0.427534,0.785469,0.769143


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.205668,0.745872,0.672023
2,0.212600,0.210247,0.698492,0.696423
3,0.141400,0.281554,0.779612,0.765651
4,0.141400,0.331408,0.788227,0.766151
5,0.070000,0.445326,0.786073,0.762484


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.205116,0.755853,0.753693
2,0.210200,0.174034,0.804682,0.795242
3,0.137800,0.29092,0.806689,0.793487
4,0.078600,0.281582,0.798662,0.790563
5,0.078600,0.402969,0.803344,0.790439


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.193928,0.736322,0.735194
2,0.212600,0.174399,0.78708,0.781614
3,0.123100,0.330782,0.7706,0.763379
4,0.050800,0.557238,0.767304,0.754534
5,0.050800,0.615424,0.771259,0.759459


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.201046,0.74791,0.697839
2,0.220100,0.193069,0.793569,0.776477
3,0.147700,0.21169,0.792926,0.774274
4,0.107300,0.251894,0.796141,0.784047
5,0.107300,0.285151,0.792283,0.777722


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.212558,0.719671,0.641292
2,0.220500,0.176133,0.78684,0.773507
3,0.156200,0.213505,0.789582,0.768948
4,0.156200,0.270249,0.790953,0.770038
5,0.106900,0.29251,0.792324,0.776343


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.21303,0.688442,0.669559
2,0.210600,0.217848,0.761665,0.727854
3,0.140500,0.265752,0.763101,0.728547
4,0.140500,0.296287,0.762383,0.743279
5,0.090700,0.329909,0.765973,0.743419


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.185361,0.761204,0.736709
2,0.217400,0.1742,0.803344,0.788099
3,0.145100,0.208529,0.796656,0.775696
4,0.097200,0.282255,0.78796,0.772133
5,0.097200,0.298328,0.796656,0.782372


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217801,0.723138,0.705525
2,0.215700,0.197992,0.738299,0.734129
3,0.146100,0.240959,0.769941,0.760962
4,0.096600,0.327589,0.769281,0.755755
5,0.096600,0.344132,0.767963,0.755918


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.192747,0.756913,0.738464
2,0.220200,0.17278,0.8,0.786428
3,0.146400,0.18923,0.810289,0.796264
4,0.109900,0.238175,0.800643,0.788747
5,0.109900,0.275836,0.8,0.78613


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.215921,0.640164,0.64011
2,0.219000,0.215752,0.766964,0.727869
3,0.165700,0.216756,0.795065,0.773731
4,0.165700,0.223707,0.79438,0.782645
5,0.120900,0.247763,0.787526,0.772496


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217154,0.707107,0.631493
2,0.219800,0.219421,0.755205,0.714497
3,0.152000,0.215294,0.749462,0.731955
4,0.152000,0.282929,0.763819,0.739953
5,0.096900,0.331862,0.765973,0.739641


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.218677,0.60602,0.605505
2,0.234000,0.178372,0.786622,0.764945
3,0.164300,0.174943,0.803344,0.790733
4,0.109300,0.263351,0.797993,0.775311
5,0.109300,0.253343,0.811371,0.796272


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217683,0.671061,0.662903
2,0.229600,0.204894,0.692156,0.692121
3,0.167000,0.221475,0.77851,0.766282
4,0.112900,0.259569,0.769281,0.759956
5,0.112900,0.290235,0.775873,0.765504


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.224347,0.713183,0.662815
2,0.229900,0.179527,0.787781,0.769584
3,0.161300,0.198989,0.763344,0.758644
4,0.112300,0.244185,0.783923,0.768365
5,0.112300,0.302253,0.787138,0.770899


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.207933,0.705963,0.694552
2,0.224100,0.184163,0.770391,0.752526
3,0.160000,0.217876,0.772447,0.746224
4,0.160000,0.246138,0.773818,0.758893
5,0.109100,0.277149,0.77793,0.766033


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.230448,0.717157,0.634964
2,0.213300,0.205331,0.72649,0.718265
3,0.150900,0.213805,0.766691,0.745495
4,0.150900,0.286852,0.760948,0.72293
5,0.097100,0.308331,0.763101,0.727905


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217651,0.662207,0.662202
2,0.224600,0.173988,0.77592,0.771232
3,0.151600,0.205153,0.8,0.782326
4,0.105900,0.220094,0.799331,0.79097
5,0.105900,0.257435,0.788629,0.775541


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.220796,0.665788,0.66308
2,0.224000,0.207556,0.741595,0.713768
3,0.160700,0.217988,0.765326,0.754469
4,0.111200,0.280322,0.764667,0.757657
5,0.111200,0.311677,0.769941,0.757469


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.231764,0.623151,0.595728
2,0.245500,0.227113,0.612862,0.608977
3,0.233200,0.223713,0.651447,0.620051
4,0.221800,0.222175,0.650161,0.638177
5,0.221800,0.221505,0.650161,0.635191


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.230065,0.623715,0.610371
2,0.243800,0.224715,0.638794,0.616199
3,0.225800,0.224083,0.63331,0.629393
4,0.225800,0.220797,0.663468,0.640604
5,0.223100,0.220382,0.655929,0.639771


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.232466,0.644652,0.574386
2,0.238000,0.232981,0.666188,0.592609
3,0.217200,0.231354,0.659727,0.613228
4,0.217200,0.230576,0.658291,0.615024
5,0.211800,0.23128,0.661163,0.61486


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.227342,0.633445,0.617526
2,0.247900,0.224149,0.674916,0.617084
3,0.233700,0.217991,0.67291,0.65529
4,0.225300,0.215929,0.685619,0.663782
5,0.225300,0.215097,0.687625,0.66907


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.238731,0.599868,0.58942
2,0.246200,0.233572,0.609756,0.604852
3,0.226700,0.233211,0.627554,0.61574
4,0.220900,0.232254,0.629532,0.619443
5,0.220900,0.232481,0.634146,0.623422


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.238451,0.557556,0.538118
2,0.259300,0.233539,0.592926,0.564999
3,0.242000,0.230627,0.622508,0.581642
4,0.233800,0.22876,0.634727,0.607293
5,0.233800,0.228097,0.63537,0.609533


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.239902,0.572995,0.496082
2,0.258100,0.235359,0.59767,0.554536
3,0.240400,0.23272,0.612748,0.570825
4,0.240400,0.230982,0.612063,0.588804
5,0.236400,0.230481,0.619602,0.592541


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.236965,0.610194,0.471291
2,0.249100,0.234121,0.598708,0.537153
3,0.228100,0.233425,0.626705,0.52722
4,0.228100,0.23209,0.615937,0.566123
5,0.224100,0.231841,0.620244,0.567613


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.238454,0.604013,0.485722
2,0.255700,0.233879,0.598662,0.557294
3,0.242900,0.231003,0.616054,0.575321
4,0.237500,0.230112,0.610702,0.57987
5,0.237500,0.22929,0.618729,0.579808


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.242147,0.568227,0.469658
2,0.252900,0.235311,0.586684,0.58282
3,0.239500,0.232521,0.597891,0.59523
4,0.233600,0.230801,0.604483,0.602116
5,0.233600,0.229919,0.623599,0.617076


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.232476,0.626367,0.592875
2,0.246300,0.228697,0.623151,0.603878
3,0.230800,0.227094,0.616077,0.608524
4,0.228100,0.226229,0.63537,0.618174
5,0.228100,0.225734,0.636013,0.624611


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.230353,0.605209,0.591102
2,0.244800,0.226387,0.63194,0.598337
3,0.232500,0.224288,0.634681,0.615484
4,0.232500,0.222806,0.642221,0.623298
5,0.226000,0.222186,0.644962,0.628514


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.233633,0.634602,0.541393
2,0.233700,0.231283,0.646088,0.582951
3,0.227000,0.22985,0.637473,0.593534
4,0.227000,0.229329,0.643934,0.600989
5,0.218600,0.229598,0.653266,0.60476


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.230869,0.620736,0.572104
2,0.248400,0.226306,0.623411,0.612218
3,0.235400,0.223472,0.653512,0.629982
4,0.230500,0.221396,0.658863,0.638721
5,0.230500,0.220846,0.656856,0.637672


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.237544,0.584707,0.565994
2,0.240700,0.236579,0.597891,0.573181
3,0.231200,0.234016,0.61437,0.590536
4,0.226100,0.232878,0.605142,0.592616
5,0.226100,0.232662,0.602505,0.5923


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.201046,0.74791,0.697839
2,0.220100,0.193069,0.793569,0.776477
3,0.147700,0.21169,0.792926,0.774274
4,0.107300,0.251894,0.796141,0.784047
5,0.107300,0.285151,0.792283,0.777722


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.212558,0.719671,0.641292
2,0.220500,0.176133,0.78684,0.773507
3,0.156200,0.213505,0.789582,0.768948
4,0.156200,0.270249,0.790953,0.770038
5,0.106900,0.29251,0.792324,0.776343


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.21303,0.688442,0.669559
2,0.210600,0.217848,0.761665,0.727854
3,0.140500,0.265752,0.763101,0.728547
4,0.140500,0.296287,0.762383,0.743279
5,0.090700,0.329909,0.765973,0.743419


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.185361,0.761204,0.736709
2,0.217400,0.1742,0.803344,0.788099
3,0.145100,0.208529,0.796656,0.775696
4,0.097200,0.282255,0.78796,0.772133
5,0.097200,0.298328,0.796656,0.782372


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217801,0.723138,0.705525
2,0.215700,0.197992,0.738299,0.734129
3,0.146100,0.240959,0.769941,0.760962
4,0.096600,0.327589,0.769281,0.755755
5,0.096600,0.344132,0.767963,0.755918


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.192747,0.756913,0.738464
2,0.220200,0.17278,0.8,0.786428
3,0.146400,0.18923,0.810289,0.796264
4,0.109900,0.238175,0.800643,0.788747
5,0.109900,0.275836,0.8,0.78613


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.215921,0.640164,0.64011
2,0.219000,0.215752,0.766964,0.727869
3,0.165700,0.216756,0.795065,0.773731
4,0.165700,0.223707,0.79438,0.782645
5,0.120900,0.247763,0.787526,0.772496


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217154,0.707107,0.631493
2,0.219800,0.219421,0.755205,0.714497
3,0.152000,0.215294,0.749462,0.731955
4,0.152000,0.282929,0.763819,0.739953
5,0.096900,0.331862,0.765973,0.739641


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.218677,0.60602,0.605505
2,0.234000,0.178372,0.786622,0.764945
3,0.164300,0.174943,0.803344,0.790733
4,0.109300,0.263351,0.797993,0.775311
5,0.109300,0.253343,0.811371,0.796272


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217683,0.671061,0.662903
2,0.229600,0.204894,0.692156,0.692121
3,0.167000,0.221475,0.77851,0.766282
4,0.112900,0.259569,0.769281,0.759956
5,0.112900,0.290235,0.775873,0.765504


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.224347,0.713183,0.662815
2,0.229900,0.179527,0.787781,0.769584
3,0.161300,0.198989,0.763344,0.758644
4,0.112300,0.244185,0.783923,0.768365
5,0.112300,0.302253,0.787138,0.770899


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.207933,0.705963,0.694552
2,0.224100,0.184163,0.770391,0.752526
3,0.160000,0.217876,0.772447,0.746224
4,0.160000,0.246138,0.773818,0.758893
5,0.109100,0.277149,0.77793,0.766033


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.230448,0.717157,0.634964
2,0.213300,0.205331,0.72649,0.718265
3,0.150900,0.213805,0.766691,0.745495
4,0.150900,0.286852,0.760948,0.72293
5,0.097100,0.308331,0.763101,0.727905


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.217651,0.662207,0.662202
2,0.224600,0.173988,0.77592,0.771232
3,0.151600,0.205153,0.8,0.782326
4,0.105900,0.220094,0.799331,0.79097
5,0.105900,0.257435,0.788629,0.775541


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.220796,0.665788,0.66308
2,0.224000,0.207556,0.741595,0.713768
3,0.160700,0.217988,0.765326,0.754469
4,0.111200,0.280322,0.764667,0.757657
5,0.111200,0.311677,0.769941,0.757469


saving the results dataframe to CSV in rumours_output/bert_classifier_focal.csv


In [14]:
# Display the results dataframe returned by the focal-loss run.
bert_classifier

Unnamed: 0,accuracy,f1,f1_scores,precision,precision_scores,recall,recall_scores,valid_accuracy,valid_f1,valid_f1_scores,...,valid_precision_scores,valid_recall,valid_recall_scores,learning_rate,seed,loss_function,gamma,k_fold,n_splits,batch_size
0,0.625349,0.574354,"[0.7216837441152035, 0.427023945267959]",0.578569,"[0.6979110873058383, 0.4592274678111588]",0.573087,"[0.7471330275229358, 0.3990410229088972]",0.78582,0.771356,"[0.8288637587506732, 0.7138483702503151]",...,"[0.8197699190455902, 0.7273394495412844]",0.769505,"[0.8381616205619691, 0.7008486562942009]",1e-06,1,focal,2,True,5,8
0,0.646226,0.595797,"[0.7385674931129477, 0.45302593659942364]",0.602086,"[0.7107635206786851, 0.4934086629001883]",0.593694,"[0.7686353211009175, 0.4187533297815663]",0.792155,0.777186,"[0.8349389852280026, 0.7194323144104804]",...,"[0.8208798147758367, 0.7410044977511244]",0.774284,"[0.8494881289479417, 0.6990806223479491]",1e-06,12,focal,2,True,5,8
0,0.628332,0.595941,"[0.71034282393957, 0.48153926157046284]",0.595127,"[0.7199646643109541, 0.4702894870492636]",0.597158,"[0.7009747706422018, 0.4933404368673415]",0.77935,0.767093,"[0.8205240653437122, 0.7136610110197656]",...,"[0.8260485651214128, 0.7061266874350987]",0.768215,"[0.8150729688521019, 0.7213578500707214]",1e-06,123,focal,2,True,5,8


In [15]:
# Mean of the `f1` column over the rows of the results frame (one row per seed).
# NOTE(review): `f1` looks like the unweighted mean of the per-class values in
# `f1_scores`. Confirm.
bert_classifier["f1"].mean()

0.5886972007675945

In [16]:
# Mean of the `precision` column over the rows of the results frame (one row per seed).
bert_classifier["precision"].mean()

0.5919274816760146

In [17]:
# Mean of the `recall` column over the rows of the results frame (one row per seed).
bert_classifier["recall"].mean()

0.5879796514706433

In [18]:
# Stack the per-row `f1_scores` entries into one array and average over the
# rows (axis 0), giving one mean F1 value per class.
np.stack(bert_classifier["f1_scores"]).mean(axis=0)

array([0.72353135, 0.45386305])

In [19]:
# Stack the per-row `precision_scores` entries into one array and average over
# the rows (axis 0), giving one mean precision value per class.
np.stack(bert_classifier["precision_scores"]).mean(axis=0)

array([0.70954642, 0.47430854])

In [20]:
# Stack the per-row `recall_scores` entries into one array and average over
# the rows (axis 0), giving one mean recall value per class.
np.stack(bert_classifier["recall_scores"]).mean(axis=0)

array([0.73891437, 0.43704493])

## Using Cross-Entropy loss

In [21]:
# Loss settings for the second experiment: cross-entropy, which takes no gamma.
# This rebinds the `loss` and `gamma` names used by the focal-loss run above.
loss, gamma = "cross_entropy", None

In [22]:
# Repeat the fine-tuning with the current `loss`/`gamma` settings and the same
# shared `kwargs`. `results_output` points at a separate CSV so this run's
# results are stored in a different file from the focal-loss run.
# Long-running cell: the log shows many consecutive 5-epoch training runs.
bert_classifier_ce = fine_tune_transformer_average_seed(
    loss=loss,
    gamma=gamma,
    results_output=f"{output_dir}/bert_classifier_ce.csv",
    **kwargs,
)

  0%|          | 0/3 [00:00<?, ?it/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.534237,0.755627,0.74951
2,0.585600,0.523375,0.804502,0.784382
3,0.405400,0.532079,0.801286,0.782047
4,0.296200,0.760756,0.803215,0.791064
5,0.296200,0.91306,0.798071,0.784738


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.55986,0.732008,0.67919
2,0.606000,0.450734,0.797121,0.780899
3,0.429900,0.553459,0.801234,0.79099
4,0.429900,0.822448,0.800548,0.787922
5,0.296700,0.938725,0.795751,0.780803


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.515933,0.76023,0.722948
2,0.546500,0.53196,0.773869,0.739809
3,0.341900,0.75834,0.79397,0.7635
4,0.341900,1.058996,0.778177,0.763948
5,0.179000,1.216479,0.781048,0.758224


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.559142,0.77592,0.745348
2,0.562800,0.552186,0.810033,0.788503
3,0.380600,0.555676,0.820736,0.804155
4,0.294500,0.823779,0.816722,0.802666
5,0.294500,0.857257,0.820736,0.808144


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.552789,0.74555,0.712983
2,0.612300,0.534647,0.760053,0.757521
3,0.423300,0.552274,0.789057,0.779803
4,0.274700,0.889837,0.791035,0.780917
5,0.274700,1.050337,0.783125,0.772076


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.547582,0.752412,0.738554
2,0.596000,0.480532,0.792283,0.780929
3,0.426900,0.595866,0.814148,0.797325
4,0.321100,0.833292,0.797428,0.781157
5,0.321100,0.875806,0.800643,0.787334


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.616596,0.716929,0.713905
2,0.573900,0.587312,0.779986,0.775511
3,0.397300,0.750646,0.801919,0.786166
4,0.397300,0.816148,0.799178,0.781776
5,0.294700,0.955636,0.800548,0.788072


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.54022,0.73654,0.699338
2,0.567300,0.589955,0.757358,0.728379
3,0.396400,0.595849,0.763101,0.744592
4,0.396400,0.797275,0.768844,0.74231
5,0.256400,0.990864,0.767408,0.745932


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.550009,0.735117,0.669779
2,0.623900,0.514651,0.799331,0.776374
3,0.398300,0.643668,0.812709,0.804575
4,0.264800,0.774677,0.812709,0.803055
5,0.264800,0.888565,0.810033,0.798132


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.51241,0.758734,0.742125
2,0.562500,0.5406,0.789717,0.783846
3,0.384100,0.700819,0.777192,0.763501
4,0.240500,0.932919,0.782465,0.770161
5,0.240500,1.15946,0.785761,0.77512


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.496857,0.793569,0.777656
2,0.545800,0.557792,0.810289,0.791216
3,0.356700,0.760594,0.805145,0.786458
4,0.219400,0.943866,0.811576,0.795338
5,0.219400,1.018637,0.809003,0.793348


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.677707,0.664154,0.544838
2,0.628400,0.45981,0.804661,0.785889
3,0.449700,0.6078,0.799863,0.77523
4,0.449700,0.796474,0.780672,0.763701
5,0.269500,1.001797,0.793009,0.778534


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.591444,0.715721,0.610108
2,0.552700,0.612183,0.750179,0.738449
3,0.393100,0.716231,0.772434,0.759418
4,0.393100,1.031243,0.769562,0.733243
5,0.232100,1.167606,0.765973,0.734887


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.522766,0.754515,0.743486
2,0.602600,0.470483,0.797324,0.788218
3,0.408000,0.595292,0.808027,0.800734
4,0.303300,0.710465,0.81204,0.802041
5,0.303300,0.894472,0.813378,0.802025


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.536587,0.748187,0.718452
2,0.603400,0.533451,0.784443,0.769355
3,0.381100,0.763288,0.76269,0.759635
4,0.263900,0.957753,0.780488,0.769722
5,0.263900,1.144476,0.7706,0.75778


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.528591,0.751768,0.707144
2,0.593000,0.486115,0.790997,0.776345
3,0.417900,0.561344,0.798071,0.778981
4,0.323700,0.638418,0.793569,0.78118
5,0.323700,0.698787,0.790354,0.778411


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.579179,0.717615,0.646879
2,0.593200,0.494197,0.780672,0.766537
3,0.426800,0.51795,0.790953,0.776418
4,0.426800,0.654051,0.779986,0.759691
5,0.323400,0.69017,0.781357,0.763395


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.57182,0.737976,0.693232
2,0.561300,0.552549,0.755205,0.715214
3,0.390300,0.635689,0.764537,0.736138
4,0.390300,0.680342,0.766691,0.744086
5,0.292800,0.738666,0.764537,0.740369


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.520845,0.748495,0.696457
2,0.598000,0.456039,0.800669,0.779724
3,0.415400,0.472286,0.803344,0.793336
4,0.297300,0.608908,0.799331,0.780206
5,0.297300,0.613903,0.808027,0.794467


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.55618,0.735662,0.71716
2,0.576100,0.536865,0.752142,0.747253
3,0.410000,0.579441,0.775214,0.765418
4,0.310100,0.685412,0.777851,0.766534
5,0.310100,0.754841,0.77851,0.767012


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.539505,0.738907,0.717829
2,0.604800,0.470594,0.799357,0.78381
3,0.425300,0.538019,0.805788,0.789626
4,0.325400,0.631215,0.80836,0.794853
5,0.325400,0.675793,0.803215,0.789788


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.572496,0.7183,0.701099
2,0.596600,0.525223,0.763537,0.720591
3,0.472000,0.487145,0.795065,0.781936
4,0.472000,0.531315,0.797807,0.786625
5,0.370400,0.548181,0.805346,0.793097


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.591788,0.711414,0.601742
2,0.589100,0.585022,0.750179,0.706191
3,0.421900,0.572192,0.76023,0.732154
4,0.421900,0.660355,0.767408,0.744514
5,0.296100,0.711366,0.761665,0.736174


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.547845,0.728428,0.664884
2,0.619300,0.526516,0.790635,0.756748
3,0.436700,0.477522,0.805351,0.793085
4,0.340200,0.613758,0.8,0.785715
5,0.340200,0.639354,0.798662,0.78194


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.601351,0.679631,0.676251
2,0.612600,0.65691,0.665129,0.66475
3,0.441300,0.596747,0.769941,0.75275
4,0.329200,0.662894,0.767963,0.760079
5,0.329200,0.690629,0.775214,0.763763


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.537172,0.752412,0.729562
2,0.603800,0.461981,0.805145,0.788519
3,0.427900,0.495007,0.802572,0.791781
4,0.322900,0.588452,0.80836,0.791433
5,0.322900,0.640839,0.802572,0.783819


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.558819,0.717615,0.706897
2,0.603600,0.486334,0.788211,0.775122
3,0.437000,0.527239,0.779986,0.754268
4,0.437000,0.571226,0.791638,0.777727
5,0.330900,0.624998,0.789582,0.778948


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.601403,0.728643,0.630096
2,0.560700,0.559398,0.744436,0.727736
3,0.415000,0.587423,0.759512,0.742909
4,0.415000,0.731965,0.765973,0.735181
5,0.312400,0.770766,0.772434,0.742634


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.52508,0.746488,0.738581
2,0.594100,0.46971,0.799331,0.791653
3,0.401200,0.552186,0.802007,0.785129
4,0.297600,0.634235,0.803344,0.7956
5,0.297600,0.705688,0.805351,0.792356


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.559118,0.719183,0.709925
2,0.591800,0.522164,0.758075,0.737364
3,0.414700,0.580623,0.777192,0.770713
4,0.313900,0.685309,0.783125,0.771936
5,0.313900,0.73508,0.791694,0.780609


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.638994,0.638585,0.505365
2,0.655300,0.628059,0.650804,0.613345
3,0.638200,0.615601,0.664309,0.59455
4,0.604800,0.613162,0.665595,0.627888
5,0.604800,0.611834,0.664309,0.628463


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.637889,0.631254,0.540989
2,0.653400,0.625707,0.645648,0.546572
3,0.616100,0.620284,0.655243,0.627526
4,0.616100,0.609503,0.664154,0.610615
5,0.609700,0.609402,0.664839,0.626763


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.62968,0.657574,0.45596
2,0.635200,0.626317,0.666188,0.551682
3,0.592700,0.62762,0.660445,0.571023
4,0.592700,0.627438,0.661881,0.586116
5,0.575400,0.627639,0.666906,0.594987


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.635536,0.6301,0.481679
2,0.660900,0.621311,0.648829,0.508907
3,0.638700,0.606781,0.679599,0.621435
4,0.616200,0.599929,0.680936,0.618698
5,0.616200,0.597415,0.696321,0.646963


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.655548,0.59855,0.483487
2,0.657200,0.64281,0.618985,0.579847
3,0.623700,0.64118,0.62294,0.588477
4,0.604700,0.638651,0.626236,0.595527
5,0.604700,0.638471,0.628214,0.595896


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.659057,0.615434,0.393238
2,0.689600,0.645131,0.629582,0.464708
3,0.659200,0.632309,0.642444,0.556353
4,0.639400,0.625857,0.650161,0.587271
5,0.639400,0.623574,0.644373,0.590503


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.659516,0.613434,0.393177
2,0.690500,0.646807,0.628513,0.500317
3,0.652600,0.639281,0.633996,0.560982
4,0.652600,0.63408,0.636052,0.574218
5,0.640600,0.632057,0.637423,0.575302


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.643851,0.649677,0.395769
2,0.671700,0.637064,0.64537,0.432619
3,0.623500,0.633109,0.651113,0.464027
4,0.623500,0.635256,0.637473,0.53736
5,0.609800,0.634197,0.638191,0.538669


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.659567,0.620736,0.382996
2,0.685200,0.65068,0.625418,0.397899
3,0.661300,0.643088,0.632107,0.473249
4,0.650500,0.639086,0.631438,0.511833
5,0.650500,0.637919,0.6301,0.512616


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.666061,0.591958,0.380711
2,0.683200,0.65098,0.611734,0.478859
3,0.655200,0.640848,0.636124,0.578
4,0.637900,0.635439,0.642716,0.589768
5,0.637900,0.634149,0.640738,0.583114


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.645444,0.619936,0.390543
2,0.664100,0.629948,0.647588,0.551756
3,0.632200,0.621569,0.661736,0.630063
4,0.621900,0.616372,0.666881,0.626553
5,0.621900,0.614824,0.673312,0.639063


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.642814,0.616861,0.429578
2,0.658600,0.631115,0.64085,0.560132
3,0.633200,0.624222,0.650446,0.600694
4,0.633200,0.620735,0.660727,0.60915
5,0.615100,0.618619,0.660727,0.615987


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.632458,0.650395,0.418214
2,0.631000,0.628099,0.653984,0.511136
3,0.614600,0.623891,0.659009,0.531847
4,0.614600,0.621916,0.663317,0.565095
5,0.592700,0.621103,0.666188,0.566501


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.646331,0.622074,0.391718
2,0.664900,0.631001,0.644147,0.536295
3,0.645800,0.621549,0.654849,0.565812
4,0.630100,0.616379,0.664214,0.577592
5,0.630100,0.614326,0.670903,0.601204


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.658086,0.594595,0.415328
2,0.654900,0.649434,0.611074,0.519928
3,0.633700,0.645198,0.621622,0.550618
4,0.617800,0.640383,0.624918,0.577544
5,0.617800,0.637481,0.627554,0.596315


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.528591,0.751768,0.707144
2,0.593000,0.486115,0.790997,0.776345
3,0.417900,0.561344,0.798071,0.778981
4,0.323700,0.638418,0.793569,0.78118
5,0.323700,0.698787,0.790354,0.778411


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.579179,0.717615,0.646879
2,0.593200,0.494197,0.780672,0.766537
3,0.426800,0.51795,0.790953,0.776418
4,0.426800,0.654051,0.779986,0.759691
5,0.323400,0.69017,0.781357,0.763395


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.57182,0.737976,0.693232
2,0.561300,0.552549,0.755205,0.715214
3,0.390300,0.635689,0.764537,0.736138
4,0.390300,0.680342,0.766691,0.744086
5,0.292800,0.738666,0.764537,0.740369


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.520845,0.748495,0.696457
2,0.598000,0.456039,0.800669,0.779724
3,0.415400,0.472286,0.803344,0.793336
4,0.297300,0.608908,0.799331,0.780206
5,0.297300,0.613903,0.808027,0.794467


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.55618,0.735662,0.71716
2,0.576100,0.536865,0.752142,0.747253
3,0.410000,0.579441,0.775214,0.765418
4,0.310100,0.685412,0.777851,0.766534
5,0.310100,0.754841,0.77851,0.767012


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.539505,0.738907,0.717829
2,0.604800,0.470594,0.799357,0.78381
3,0.425300,0.538019,0.805788,0.789626
4,0.325400,0.631215,0.80836,0.794853
5,0.325400,0.675793,0.803215,0.789788


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.572496,0.7183,0.701099
2,0.596600,0.525223,0.763537,0.720591
3,0.472000,0.487145,0.795065,0.781936
4,0.472000,0.531315,0.797807,0.786625
5,0.370400,0.548181,0.805346,0.793097


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.591788,0.711414,0.601742
2,0.589100,0.585022,0.750179,0.706191
3,0.421900,0.572192,0.76023,0.732154
4,0.421900,0.660355,0.767408,0.744514
5,0.296100,0.711366,0.761665,0.736174


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.547845,0.728428,0.664884
2,0.619300,0.526516,0.790635,0.756748
3,0.436700,0.477522,0.805351,0.793085
4,0.340200,0.613758,0.8,0.785715
5,0.340200,0.639354,0.798662,0.78194


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.601351,0.679631,0.676251
2,0.612600,0.65691,0.665129,0.66475
3,0.441300,0.596747,0.769941,0.75275
4,0.329200,0.662894,0.767963,0.760079
5,0.329200,0.690629,0.775214,0.763763


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.537172,0.752412,0.729562
2,0.603800,0.461981,0.805145,0.788519
3,0.427900,0.495007,0.802572,0.791781
4,0.322900,0.588452,0.80836,0.791433
5,0.322900,0.640839,0.802572,0.783819


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.558819,0.717615,0.706897
2,0.603600,0.486334,0.788211,0.775122
3,0.437000,0.527239,0.779986,0.754268
4,0.437000,0.571226,0.791638,0.777727
5,0.330900,0.624998,0.789582,0.778948


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.601403,0.728643,0.630096
2,0.560700,0.559398,0.744436,0.727736
3,0.415000,0.587423,0.759512,0.742909
4,0.415000,0.731965,0.765973,0.735181
5,0.312400,0.770766,0.772434,0.742634


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.52508,0.746488,0.738581
2,0.594100,0.46971,0.799331,0.791653
3,0.401200,0.552186,0.802007,0.785129
4,0.297600,0.634235,0.803344,0.7956
5,0.297600,0.705688,0.805351,0.792356


Map:   0%|          | 0/5568 [00:00<?, ? examples/s]

Map:   0%|          | 0/5568 [00:00<?, ? examples/s]



Epoch,Training Loss,Validation Loss,Validation accuracy,Validation f1
1,No log,0.559118,0.719183,0.709925
2,0.591800,0.522164,0.758075,0.737364
3,0.414700,0.580623,0.777192,0.770713
4,0.313900,0.685309,0.783125,0.771936
5,0.313900,0.73508,0.791694,0.780609


saving the results dataframe to CSV in rumours_output/bert_classifier_ce.csv


In [23]:
# Inspect the cross-entropy results frame: one row per seed, holding overall and
# per-class (`*_scores`) metrics alongside their `valid_`-prefixed counterparts.
bert_classifier_ce

Unnamed: 0,accuracy,f1,f1_scores,precision,precision_scores,recall,recall_scores,valid_accuracy,valid_f1,valid_f1_scores,...,valid_precision_scores,valid_recall,valid_recall_scores,learning_rate,seed,loss_function,gamma,k_fold,n_splits,batch_size
0,0.641566,0.599106,"[0.729573899592181, 0.46863774523348994]",0.601389,"[0.7159812310240132, 0.48679678530424797]",0.597739,"[0.7436926605504587, 0.4517847629195525]",0.787842,0.773333,"[0.8306798623063684, 0.7159870083002526]",...,"[0.8206163655685441, 0.7310243183492999]",0.771275,"[0.8409932476584622, 0.7015558698727016]",1e-06,1,cross_entropy,,True,5,8
0,0.637651,0.590118,"[0.7296996662958843, 0.45053702656868283]",0.594127,"[0.7084233261339092, 0.4798314268512944]",0.588454,"[0.7522935779816514, 0.4246137453383058]",0.792694,0.778646,"[0.8344099913867356, 0.7228828828828827]",...,"[0.8249946774536938, 0.7369581190301249]",0.776689,"[0.8440426922239164, 0.7093352192362093]",1e-06,12,cross_entropy,,True,5,8
0,0.62479,0.598535,"[0.7012023155707289, 0.49586776859504134]",0.597428,"[0.7269929208987381, 0.4678638941398866]",0.602308,"[0.6771788990825688, 0.527437400106553]",0.789864,0.778789,"[0.8282850534199803, 0.7292932800833478]",...,"[0.8377896613190731, 0.7164790174002047]",0.780784,"[0.8189936832934002, 0.7425742574257426]",1e-06,123,cross_entropy,,True,5,8


In [24]:
# Average the overall F1 across the per-seed rows of the results frame.
# NOTE(review): the unprefixed columns are presumably test-split metrics
# (as opposed to `valid_*`) — confirm against the fine-tuning helper.
bert_classifier_ce.loc[:, "f1"].mean()

0.5959197369760014

In [25]:
# Average the overall precision across the per-seed rows of the results frame.
bert_classifier_ce.loc[:, "precision"].mean()

0.5976482640586817

In [26]:
# Average the overall recall across the per-seed rows of the results frame.
bert_classifier_ce.loc[:, "recall"].mean()

0.596166840996515

In [27]:
# Per-class F1 averaged over seeds: stack each row's score vector into a
# (rows, classes) array, then average down the row axis.
# NOTE(review): class order presumably follows the label ids (0, 1) — confirm.
np.mean(np.stack(bert_classifier_ce["f1_scores"]), axis=0)

array([0.72015863, 0.47168085])

In [28]:
# Per-class precision averaged over seeds: stack each row's score vector into a
# (rows, classes) array, then average down the row axis.
np.mean(np.stack(bert_classifier_ce["precision_scores"]), axis=0)

array([0.71713249, 0.47816404])

In [29]:
# Per-class recall averaged over seeds: stack each row's score vector into a
# (rows, classes) array, then average down the row axis.
np.mean(np.stack(bert_classifier_ce["recall_scores"]), axis=0)

array([0.72438838, 0.4679453 ])