# Parameters 

In [1]:
# Model
model_checkpoint = 'bert-base-uncased'
batch_size = 8
metric_name = "accuracy"

# Fold
fold = 0

# Experiment
labels = ["none", "attribution", "causal", "conditional", "contrast", "description", "equivalence", "fulfillment", "identity", "purpose", "summary", "temporal"]

# Import

In [2]:
import torch
import numpy as np
import random
import pandas as pd
from IPython.display import display, HTML

In [3]:
def import_fold(path, fold):
    train = pd.read_csv(f"{path}/train.{fold}.csv")
    test = pd.read_csv(f"{path}/train.{fold}.csv")
    return train, test

train_df, test_df = import_fold("data/export", fold)
display(train_df)

train_origin = train_df["origin"].tolist()
train_target = train_df["target"].tolist()
train_labels = train_df["label"].tolist()
test_origin = test_df["origin"].tolist()
test_target = test_df["target"].tolist()
test_labels = test_df["label"].tolist()

Unnamed: 0,origin,target,label
0,Canada confirms fifth case of Mad Cow Disease....,Swine flu: recent developments worldwide. A ma...,0
1,Swine flu: recent developments worldwide. A ma...,Canada confirms fifth case of Mad Cow Disease....,0
2,U.K. National Portrait Gallery threatens U.S. ...,Church of Scientology attempting to block 'int...,0
3,Church of Scientology attempting to block 'int...,U.K. National Portrait Gallery threatens U.S. ...,0
4,31 children rescued as UK police shut down glo...,U.K. National Portrait Gallery threatens U.S. ...,0
...,...,...,...
3163,Efforts to cap Deepwater Horizon oil spill del...,"Deepwater Horizon oil well finally dead, autho...",2
3164,"Volcano near Anchorage, Alaska erupts, airport...",Volcano erupts in southern Chile. This was not...,0
3165,Volcano erupts in southern Chile. This was not...,"Volcano near Anchorage, Alaska erupts, airport...",0
3166,More suspected plane debris washes ashore on M...,Malaysia says debris found in Maldives could b...,11


# Model 

## Metric

In [4]:
from sklearn.metrics import classification_report
import collections

#classification_threshold = 0.

def flatten(d, parent_key='', sep='__'):
    items = []
    for k, v in d.items():
        new_key = parent_key + sep + k if parent_key else k
        if isinstance(v, collections.MutableMapping):
            items.extend(flatten(v, new_key, sep=sep).items())
        else:
            items.append((new_key, v))
    return dict(items)

def compute_metrics(eval_pred):
    global labels
    predictions, true_labels = eval_pred
    # take most probable guess
    predictions = np.argmax(predictions, axis=-1)
    return flatten(classification_report(
        y_true=true_labels,
        y_pred=predictions,
        target_names=labels,
        zero_division=0,
        output_dict=True))

In [5]:
#TEST
#flatten(classification_report(
#    y_true=[0,1,2,3,4,5,6,7,8,9,10,11,12],
#    y_pred=[0,0,0,1,3,0,0,0,0,0,0,0,0],
#    target_names=labels,
#    zero_division=0,
#    output_dict=True))

## Model Settings

In [6]:
from transformers import AutoModelForSequenceClassification, TrainingArguments, Trainer

args = TrainingArguments(
    "semantic-test",
    evaluation_strategy = "epoch",
    learning_rate=2e-5,
    per_device_train_batch_size=batch_size,
    per_device_eval_batch_size=batch_size,
    num_train_epochs=5,
    weight_decay=0.01,
    load_best_model_at_end=True,
    metric_for_best_model=metric_name,
)

## Tokenize

In [7]:
from transformers import BertTokenizerFast
tokenizer = BertTokenizerFast.from_pretrained(model_checkpoint)

In [8]:
train_encodings = tokenizer(train_origin, train_target, truncation=True, padding=True, return_token_type_ids=True)
test_encodings = tokenizer(test_origin, test_target, truncation=True, padding=True, return_token_type_ids=True)

## Print Examples

In [9]:
#train_encodings

In [10]:
def show_random_elements(origin_list, target_list, label_list, encodings, num_examples=10):
    global labels
    assert num_examples <= len(origin_list), "Can't pick more elements than there are in the dataset."
    picks = []
    for _ in range(num_examples):
        pick = random.randint(0, len(origin_list)-1)
        while pick in picks:
            pick = random.randint(0, len(origin_list)-1)
        picks.append(pick)
    data = []
    for n in picks:
        data.append([n, origin_list[n], labels[label_list[n]], target_list[n], encodings.input_ids[n], encodings.token_type_ids[n], encodings.attention_mask[n]])
    df = pd.DataFrame(data, columns=['index', 'Origin', 'Label', 'Target', 'Input_ids', 'Token_type_ids', 'Attention_mask'])
    display(HTML(df.to_html()))

In [11]:
show_random_elements(train_origin, train_target, train_labels, train_encodings)
# Output adjustet to Folds
#show_random_elements(k_fold_origin[0][0], k_fold_target[0][0], k_fold_labels[0][0], train_encodings[0])

Unnamed: 0,index,Origin,Label,Target,Input_ids,Token_type_ids,Attention_mask
0,424,"Spanish Prime Minster condemns killing of Spanish councillor. Zapatero told the press that the ETA is defeated by democracy, and that the Government wants to roundly manifest that those who took part in the shooting will be arrested shortly, and to express its solidarity with the family and companions of Isaías, in both the PSE Basque Socialist Party and in the UGT trade union. March 7, 2008",causal,"Basque separatist group ETA declares ceasefire. The bombing was frowned upon by all involved in the peace process, including other Basque separatist parties in the region. September 6, 2010","[101, 3009, 3539, 8117, 6238, 28887, 2015, 4288, 1997, 3009, 10674, 1012, 23564, 17585, 3217, 2409, 1996, 2811, 2008, 1996, 27859, 2003, 3249, 2011, 7072, 1010, 1998, 2008, 1996, 2231, 4122, 2000, 2461, 2135, 19676, 2008, 2216, 2040, 2165, 2112, 1999, 1996, 5008, 2097, 2022, 4727, 3859, 1010, 1998, 2000, 4671, 2049, 14657, 2007, 1996, 2155, 1998, 11946, 1997, 18061, 7951, 1010, 1999, 2119, 1996, 8827, 2063, 13915, 6102, 2283, 1998, 1999, 1996, 1057, 13512, 3119, 2586, 1012, 2233, 1021, 1010, 2263, 102, 13915, 19802, 25879, 2923, 2177, 27859, 18806, 26277, 1012, 1996, 8647, 2001, 7335, 2588, 2011, 2035, 2920, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]"
1,1582,"Scholastic sued for Harry Potter copyright infringement. The complaint stated that in both books, the protagonists are required to deduce the exact nature of the central task in the competition, and had done so in a bathroom. July 14, 2010",none,"Portuguese writer José Saramago dies at 87. As Saramago Foundation reported, today, June 18, José Saramago has died at 12:30 at his home in Lanzarote, at 87 years old, as the aftermath of a multiorgan failure, after a prolonged illness. June 18, 2010","[101, 24105, 12923, 2005, 4302, 10693, 9385, 20701, 1012, 1996, 12087, 3090, 2008, 1999, 2119, 2808, 1010, 1996, 21989, 2024, 3223, 2000, 2139, 8566, 3401, 1996, 6635, 3267, 1997, 1996, 2430, 4708, 1999, 1996, 2971, 1010, 1998, 2018, 2589, 2061, 1999, 1037, 5723, 1012, 2251, 2403, 1010, 2230, 102, 5077, 3213, 4560, 7354, 2863, 3995, 8289, 2012, 6584, 1012, 2004, 7354, 2863, 3995, 3192, 2988, 1010, 2651, 1010, 2238, 2324, 1010, 4560, 7354, 2863, 3995, 2038, 2351, 2012, 2260, 1024, 2382, 2012, 2010, 2188, 1999, 17595, 9057, 12184, 1010, 2012, 6584, 2086, 2214, 1010, 2004, 1996, 10530, 1997, 1037, 4800, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]"
2,365,"Malaysia says debris found in Maldives could be from MH370. Debris has since washed ashore on at least three other Maldives locations, the Fehendhoo and Fulhahdhoo, but most of it isn't believed to be from an aircraft. August 10, 2015",causal,"Malaysia to investigate suspected plane debris washed ashore on several Maldives islands. Abdulla Rasheed, a captain of a cargo boat which recently capsized in the waters off the Maldives, stated, From the pictures of the debris found on most of the islands, I can almost certainly say that they are from the cargo we were carrying. August 9, 2015","[101, 6027, 2758, 11385, 2179, 1999, 25059, 2071, 2022, 2013, 1049, 2232, 24434, 2692, 1012, 11385, 2038, 2144, 8871, 16145, 2006, 2012, 2560, 2093, 2060, 25059, 5269, 1010, 1996, 10768, 22342, 6806, 2080, 1998, 11865, 2140, 3270, 14945, 6806, 2080, 1010, 2021, 2087, 1997, 2009, 3475, 1005, 1056, 3373, 2000, 2022, 2013, 2019, 2948, 1012, 2257, 2184, 1010, 2325, 102, 6027, 2000, 8556, 6878, 4946, 11385, 8871, 16145, 2006, 2195, 25059, 3470, 1012, 10298, 2721, 23438, 13089, 1010, 1037, 2952, 1997, 1037, 6636, 4049, 2029, 3728, 9700, 3550, 1999, 1996, 5380, 2125, 1996, 25059, 1010, 3090, 1010, 2013, 1996, 4620, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]"
3,3007,"WWE Raw Results from Cincinnati, OH for September 22, 2008. Michaels would tag in one last time while Batista would continue to fight outside of the ring with Layfield. September 22, 2008",none,"WWE Raw Results from Memphis, TN for September 15, 2008. After the match, Jericho would seek out WWE Raw General Manager Mike Adamle, taking issue with being booked to wrestle in four high-profile matches in a three-week time span, and demanded that the rookie G.M. needed to learn how to take care of his champions. September 15, 2008","[101, 11700, 6315, 3463, 2013, 7797, 1010, 2821, 2005, 2244, 2570, 1010, 2263, 1012, 17784, 2052, 6415, 1999, 2028, 2197, 2051, 2096, 7151, 11921, 2052, 3613, 2000, 2954, 2648, 1997, 1996, 3614, 2007, 3913, 3790, 1012, 2244, 2570, 1010, 2263, 102, 11700, 6315, 3463, 2013, 9774, 1010, 28286, 2005, 2244, 2321, 1010, 2263, 1012, 2044, 1996, 2674, 1010, 17309, 2052, 6148, 2041, 11700, 6315, 2236, 3208, 3505, 4205, 2571, 1010, 2635, 3277, 2007, 2108, 17414, 2000, 25579, 1999, 2176, 2152, 1011, 6337, 3503, 1999, 1037, 2093, 1011, 2733, 2051, 8487, 1010, 1998, 6303, 2008, 1996, 8305, 1043, 1012, 1049, 1012, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]"
4,3021,"Fußball-Bundesliga 2007–08: Bayern Munich vs. Wolfsburg. Bayern Munich beat Wolfsburg 2-1 to remain at the top of the Bundesliga table. November 24, 2007",temporal,"Fußball-Bundesliga 2008–09: Wolfsburg win first season title. Wolfsburg manager Felix Magath Wolfsburg went into the match holding a two-point advantage over Bayern Munich and VfB Stuttgart, who played each other at the same time. May 23, 2009","[101, 11865, 19310, 7384, 1011, 14250, 2289, 1516, 5511, 1024, 21350, 7469, 5443, 1012, 4702, 9695, 1012, 21350, 7469, 3786, 4702, 9695, 1016, 1011, 1015, 2000, 3961, 2012, 1996, 2327, 1997, 1996, 14250, 2795, 1012, 2281, 2484, 1010, 2289, 102, 11865, 19310, 7384, 1011, 14250, 2263, 1516, 5641, 1024, 4702, 9695, 2663, 2034, 2161, 2516, 1012, 4702, 9695, 3208, 8383, 23848, 8988, 4702, 9695, 2253, 2046, 1996, 2674, 3173, 1037, 2048, 1011, 2391, 5056, 2058, 21350, 7469, 1998, 1058, 26337, 13022, 1010, 2040, 2209, 2169, 2060, 2012, 1996, 2168, 2051, 1012, 2089, 2603, 1010, 2268, 102, 0, 0, 0, 0, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, ...]"
5,1971,"Palestinians to elect new president on January 9. New leadership could prove to be the key to revitalizing the peace process in the Middle East, as both Israel and the United States had refused to work with Arafat. November 14, 2004",none,"Investigation wanted into the murders of Iraqi academics. The situation in the last six months has gotten so bad, we couldn't continue. February 1,2006","[101, 21524, 2000, 11322, 2047, 2343, 2006, 2254, 1023, 1012, 2047, 4105, 2071, 6011, 2000, 2022, 1996, 3145, 2000, 7065, 18400, 6026, 1996, 3521, 2832, 1999, 1996, 2690, 2264, 1010, 2004, 2119, 3956, 1998, 1996, 2142, 2163, 2018, 4188, 2000, 2147, 2007, 19027, 27753, 1012, 2281, 2403, 1010, 2432, 102, 4812, 2359, 2046, 1996, 9916, 1997, 8956, 15032, 1012, 1996, 3663, 1999, 1996, 2197, 2416, 2706, 2038, 5407, 2061, 2919, 1010, 2057, 2481, 1005, 1056, 3613, 1012, 2337, 1015, 1010, 2294, 102, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]"
6,2546,"President of China lunches with Brazilian President. Hu Jintao, the President of the People's Republic of China had lunch today with the President of Brazil, Luiz Inácio Lula da Silva, at the Granja do Torto, the President's country residence in the Brazilian Federal District. November 12, 2004",temporal,"Lula's future in the hands of Brazilian Parliament. On June 4, during the so called Curupira operation, the Brazilian Federal Police arrested members of IBAMA, a Brazilian agency for environment. June 6, 2005","[101, 2343, 1997, 2859, 6265, 2229, 2007, 6142, 2343, 1012, 15876, 9743, 28555, 1010, 1996, 2343, 1997, 1996, 2111, 1005, 1055, 3072, 1997, 2859, 2018, 6265, 2651, 2007, 1996, 2343, 1997, 4380, 1010, 11320, 10993, 27118, 9793, 11320, 2721, 4830, 11183, 1010, 2012, 1996, 12604, 3900, 2079, 17153, 3406, 1010, 1996, 2343, 1005, 1055, 2406, 5039, 1999, 1996, 6142, 2976, 2212, 1012, 2281, 2260, 1010, 2432, 102, 11320, 2721, 1005, 1055, 2925, 1999, 1996, 2398, 1997, 6142, 3323, 1012, 2006, 2238, 1018, 1010, 2076, 1996, 2061, 2170, 12731, 21531, 7895, 3169, 1010, 1996, 6142, 2976, 2610, 4727, 2372, 1997, 21307, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]"
7,2173,"Hamas wins Palestinian election. Mushir al-Masri, who won the election said in regards to Israel, negotiations with Israel are not on our agenda. January 29, 2005",none,"Palestinians to elect new president on January 9. Acting president Rawhi Fattuh has announced today that Palestinian elections will be held on January 9. November 14, 2004","[101, 22129, 5222, 9302, 2602, 1012, 14163, 6182, 2099, 2632, 1011, 16137, 3089, 1010, 2040, 2180, 1996, 2602, 2056, 1999, 12362, 2000, 3956, 1010, 7776, 2007, 3956, 2024, 2025, 2006, 2256, 11376, 1012, 2254, 2756, 1010, 2384, 102, 21524, 2000, 11322, 2047, 2343, 2006, 2254, 1023, 1012, 3772, 2343, 6315, 4048, 6638, 8525, 2232, 2038, 2623, 2651, 2008, 9302, 3864, 2097, 2022, 2218, 2006, 2254, 1023, 1012, 2281, 2403, 1010, 2432, 102, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]"
8,1690,"President Bush: U.S. respects Pakistan's sovereignty. Bush also expressed full support for the Friends of Pakistan initiative to drum up international support for its economic development. September 23, 2008",contrast,"UN report says death of Benazir Bhutto preventable; fault of government. The report, released by a three-person UN commission, accused the Pakistani government of failing to take the necessary measures to respond to the extraordinary, fresh and urgent security risks that they knew she faced. April 16, 2010","[101, 2343, 5747, 1024, 1057, 1012, 1055, 1012, 17475, 4501, 1005, 1055, 12601, 1012, 5747, 2036, 5228, 2440, 2490, 2005, 1996, 2814, 1997, 4501, 6349, 2000, 6943, 2039, 2248, 2490, 2005, 2049, 3171, 2458, 1012, 2244, 2603, 1010, 2263, 102, 4895, 3189, 2758, 2331, 1997, 3841, 16103, 2099, 1038, 6979, 9284, 4652, 3085, 1025, 6346, 1997, 2231, 1012, 1996, 3189, 1010, 2207, 2011, 1037, 2093, 1011, 2711, 4895, 3222, 1010, 5496, 1996, 9889, 2231, 1997, 7989, 2000, 2202, 1996, 4072, 5761, 2000, 6869, 2000, 1996, 9313, 1010, 4840, 1998, 13661, 3036, 10831, 2008, 2027, 2354, 2016, 4320, 1012, 2258, 2385, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, ...]"
9,2454,"Palestinians to elect new president on January 9. The Haaretz had initially reported that former prime minister Mahmoud Abbas was selected by the Fatah central committee as their candidate for president, but Abbas has denied this, saying, the matter is still being discussed. November 14, 2004",temporal,"Egypt seals border with Gaza after 11 days. Egypt says at least 17 Palestinians have been arrested in Sinai carrying weapons and explosives since the crisis began. February 3, 2008","[101, 21524, 2000, 11322, 2047, 2343, 2006, 2254, 1023, 1012, 1996, 5292, 12069, 5753, 2018, 3322, 2988, 2008, 2280, 3539, 2704, 27278, 17532, 2001, 3479, 2011, 1996, 6638, 4430, 2430, 2837, 2004, 2037, 4018, 2005, 2343, 1010, 2021, 17532, 2038, 6380, 2023, 1010, 3038, 1010, 1996, 3043, 2003, 2145, 2108, 6936, 1012, 2281, 2403, 1010, 2432, 102, 5279, 13945, 3675, 2007, 14474, 2044, 2340, 2420, 1012, 5279, 2758, 2012, 2560, 2459, 21524, 2031, 2042, 4727, 1999, 20837, 4755, 4255, 1998, 14792, 2144, 1996, 5325, 2211, 1012, 2337, 1017, 1010, 2263, 102, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]","[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]","[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, ...]"


## Create Dataset

In [12]:
class SemanticDataset(torch.utils.data.Dataset):
    def __init__(self, encodings, labels):
        self.encodings = encodings
        self.labels = labels

    def __getitem__(self, idx):
        item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}
        item['labels'] = torch.tensor(self.labels[idx])
        return item

    def __len__(self):
        return len(self.labels)

train_dataset = SemanticDataset(train_encodings, train_labels)
test_dataset = SemanticDataset(test_encodings, test_labels)

# Model

## Create Model

In [13]:
num_labels = len(labels)
model = AutoModelForSequenceClassification.from_pretrained(model_checkpoint, num_labels=num_labels)

Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.seq_relationship.bias', 'cls.predictions.decoder.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.bias', 'cls.seq_relationship.weight', 'cls.predictions.bias']
- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of BertForSequenceClassification were not initialized from the model checkpoint at

## Create Trainer

In [14]:
trainer = Trainer(
    model,
    args,
    train_dataset=train_dataset,
    eval_dataset=test_dataset,
    tokenizer=tokenizer,
    compute_metrics=compute_metrics
)

## Train

In [15]:
trainer.train()

Epoch,Training Loss,Validation Loss,None Precision,None Recall,None F1-score,None Support,Attribution Precision,Attribution Recall,Attribution F1-score,Attribution Support,Causal Precision,Causal Recall,Causal F1-score,Causal Support,Conditional Precision,Conditional Recall,Conditional F1-score,Conditional Support,Contrast Precision,Contrast Recall,Contrast F1-score,Contrast Support,Description Precision,Description Recall,Description F1-score,Description Support,Equivalence Precision,Equivalence Recall,Equivalence F1-score,Equivalence Support,Fulfillment Precision,Fulfillment Recall,Fulfillment F1-score,Fulfillment Support,Identity Precision,Identity Recall,Identity F1-score,Identity Support,Purpose Precision,Purpose Recall,Purpose F1-score,Purpose Support,Summary Precision,Summary Recall,Summary F1-score,Summary Support,Temporal Precision,Temporal Recall,Temporal F1-score,Temporal Support,Accuracy,Macro avg Precision,Macro avg Recall,Macro avg F1-score,Macro avg Support,Weighted avg Precision,Weighted avg Recall,Weighted avg F1-score,Weighted avg Support
1,No log,0.882111,0.793292,0.982134,0.87767,2071,0.0,0.0,0.0,15,0.212766,0.143369,0.171306,279,0.0,0.0,0.0,35,0.0,0.0,0.0,105,0.0,0.0,0.0,30,0.5,0.063725,0.113043,204,0.0,0.0,0.0,24,0.0,0.0,0.0,52,0.0,0.0,0.0,15,0.0,0.0,0.0,12,0.253846,0.303681,0.276536,326,0.690025,0.146659,0.124409,0.11988,3168,0.595651,0.690025,0.624577,3168
2,1.097100,0.672051,0.932781,0.978271,0.954985,2071,0.0,0.0,0.0,15,0.290647,0.724014,0.414784,279,0.0,0.0,0.0,35,0.0,0.0,0.0,105,0.0,0.0,0.0,30,1.0,0.014706,0.028986,204,0.0,0.0,0.0,24,0.0,0.0,0.0,52,0.0,0.0,0.0,15,0.0,0.0,0.0,12,0.661074,0.604294,0.63141,326,0.766414,0.240375,0.193441,0.16918,3168,0.7678,0.766414,0.727668,3168
3,0.796900,0.584417,0.947051,0.984549,0.965436,2071,0.0,0.0,0.0,15,0.488449,0.530466,0.508591,279,0.0,0.0,0.0,35,0.0,0.0,0.0,105,0.0,0.0,0.0,30,0.425532,0.588235,0.493827,204,0.0,0.0,0.0,24,0.0,0.0,0.0,52,0.0,0.0,0.0,15,0.0,0.0,0.0,12,0.639535,0.843558,0.727513,326,0.815025,0.208381,0.245567,0.224614,3168,0.75534,0.815025,0.782583,3168
4,0.584100,0.469592,0.998033,0.980203,0.989038,2071,0.0,0.0,0.0,15,0.740741,0.645161,0.689655,279,0.0,0.0,0.0,35,0.0,0.0,0.0,105,0.0,0.0,0.0,30,0.377691,0.946078,0.53986,204,0.0,0.0,0.0,24,0.0,0.0,0.0,52,0.0,0.0,0.0,15,0.0,0.0,0.0,12,0.827586,0.957055,0.887624,326,0.857008,0.245338,0.294041,0.258848,3168,0.827158,0.857008,0.833399,3168
5,0.584100,0.412937,0.997569,0.990826,0.994186,2071,0.0,0.0,0.0,15,0.763251,0.774194,0.768683,279,0.0,0.0,0.0,35,0.0,0.0,0.0,105,0.0,0.0,0.0,30,0.403805,0.936275,0.564254,204,0.0,0.0,0.0,24,0.0,0.0,0.0,52,0.0,0.0,0.0,15,0.0,0.0,0.0,12,0.884181,0.960123,0.920588,326,0.875,0.254067,0.305118,0.270643,3168,0.836342,0.875,0.848687,3168


  if isinstance(v, collections.MutableMapping):


TrainOutput(global_step=1980, training_loss=0.7453565038815894, metrics={'train_runtime': 545.4221, 'train_samples_per_second': 3.63, 'total_flos': 0, 'epoch': 5.0})

## Evaluate

### Test Dataset

In [16]:
# Run Evaluation on Dataset with all trainers and return k-fold index of highest accuracy
def format_result(result):
    df = pd.DataFrame([result])
    display(HTML(df.T.to_html()))
    
format_result(trainer.evaluate(test_dataset))

Unnamed: 0,0
eval_loss,0.412937
eval_none__precision,0.997569
eval_none__recall,0.990826
eval_none__f1-score,0.994186
eval_none__support,2071.0
eval_attribution__precision,0.0
eval_attribution__recall,0.0
eval_attribution__f1-score,0.0
eval_attribution__support,15.0
eval_causal__precision,0.763251


## Prediction

In [17]:
# Take best trainer
#trainer = trainers[best_fold_idx]

In [18]:
prediction_output = trainer.predict(test_dataset)

### Prediction metrics

In [19]:
df = pd.DataFrame([prediction_output.metrics])
display(df.T)

Unnamed: 0,0
test_loss,0.412937
test_none__precision,0.997569
test_none__recall,0.990826
test_none__f1-score,0.994186
test_none__support,2071.0
test_attribution__precision,0.0
test_attribution__recall,0.0
test_attribution__f1-score,0.0
test_attribution__support,15.0
test_causal__precision,0.763251


### Prediction Examples

In [20]:
def example_prediction_output(result, origin_list, target_list, label_list, success=True, max_number=10):
    global labels
    # Real Relation
    data = []
    for n in range(len(origin_list)):
        data.append([origin_list[n], target_list[n], labels[label_list[n]]])
    df_real = pd.DataFrame(data, columns=['Origin', 'Target', 'Label'])
    # Predicted Label
    label_data = []
    for n in result.label_ids:
        i = np.argmax(result.predictions[n], axis=-1)
        label_data.append([labels[i]])
    df_pred_labels = pd.DataFrame(label_data, columns=["Prediction"])
    # Prediction Metrics
    df_predictions = pd.DataFrame(result.predictions, columns=labels)
    df_predictions = df_predictions.add_prefix("Pred_")
    df = pd.concat([df_real, df_pred_labels, df_predictions], axis=1)
    # Filter complete output to show example
    if success:
        # If possible only show examples with right predicted label that is not none
        df_tmp = df[(df.Label == df.Prediction) & (df.Label != "none")]
        if(df_tmp.size == 0):
            # if there is no match without label "none", print the "none"-matches
            df = df[(df.Label == df.Prediction)]
        else:
            df = df_tmp
    else:
        # If possible only show examples with right predicted label that is not none
        df_tmp = df[(df.Label != df.Prediction) & (df.Label != "none") & (df.Prediction != "none")]
        if(df_tmp.size == 0):
            df_tmp = df[(df.Label != df.Prediction) & ((df.Label != "none") | (df.Prediction != "none"))]
            if(df_tmp.size == 0):
                df = df[df.Label != df.Prediction]
            else:
                df = df_tmp
        else:
            df = df_tmp
    display(HTML(df.head(max_number).to_html()))

#### Successes

In [21]:
example_prediction_output(prediction_output, test_origin, test_target, test_labels)

Unnamed: 0,Origin,Target,Label,Prediction,Pred_none,Pred_attribution,Pred_causal,Pred_conditional,Pred_contrast,Pred_description,Pred_equivalence,Pred_fulfillment,Pred_identity,Pred_purpose,Pred_summary,Pred_temporal
0,"Canada confirms fifth case of Mad Cow Disease. This is Canada's fifth confirmed case of the disease since May 2003, and officials have tested more than 100,000 cows since the first case of the disease turned up in Alberta. April 14, 2006","Swine flu: recent developments worldwide. A majority of the cases were reported by the United States, which now has at least 10,053 confirmed infections from the disease. May 19, 2009",none,none,6.796221,-0.310706,-0.037133,-0.411199,-1.136399,-0.951643,-1.08762,-0.564183,-1.804138,-0.369897,-0.601369,0.821839
1,"Swine flu: recent developments worldwide. A majority of the cases were reported by the United States, which now has at least 10,053 confirmed infections from the disease. May 19, 2009","Canada confirms fifth case of Mad Cow Disease. This is Canada's fifth confirmed case of the disease since May 2003, and officials have tested more than 100,000 cows since the first case of the disease turned up in Alberta. April 14, 2006",none,none,6.937126,-0.426267,0.189443,-0.461942,-1.04427,-0.933352,-0.989166,-0.558361,-1.735762,-0.455372,-0.602375,0.421047
2,"U.K. National Portrait Gallery threatens U.S. citizen with legal action over Wikimedia images. David Gerard, former Press Officer for Wikimedia UK, the U.K. chapter of the Wikimedia Foundation, which has been involved with the Wikipedia Loves Art contest to create free content photographs of exhibits at the Victoria and Albert Museum, stated on Slashdot that The NPG actually acknowledges in their letter that the poster's actions were entirely legal in America, and that they're making a threat just because they think they can. July 11, 2009","Church of Scientology attempting to block 'intolerant' German film. Carl Bergengruen, the head of TV movies for Südwestrundfunk (SWR or Southwest Broadcasting), the public broadcaster backing the project defended their secrecy practices saying, Scientology kept trying to use a variety of methods to find out details about the project. March 15, 2010",none,none,7.684356,-0.934911,0.937986,-0.539007,-0.814859,-1.310764,-0.9842,-0.9214,-1.907234,-0.786805,-1.076709,-0.094654
3,"Church of Scientology attempting to block 'intolerant' German film. Carl Bergengruen, the head of TV movies for Südwestrundfunk (SWR or Southwest Broadcasting), the public broadcaster backing the project defended their secrecy practices saying, Scientology kept trying to use a variety of methods to find out details about the project. March 15, 2010","U.K. National Portrait Gallery threatens U.S. citizen with legal action over Wikimedia images. David Gerard, former Press Officer for Wikimedia UK, the U.K. chapter of the Wikimedia Foundation, which has been involved with the Wikipedia Loves Art contest to create free content photographs of exhibits at the Victoria and Albert Museum, stated on Slashdot that The NPG actually acknowledges in their letter that the poster's actions were entirely legal in America, and that they're making a threat just because they think they can. July 11, 2009",none,none,7.430922,-0.593533,0.461762,-0.423344,-0.868214,-1.037013,-0.982202,-0.813418,-1.888756,-0.603058,-0.726541,0.050769
4,"31 children rescued as UK police shut down global paedophile ring. Cox himself was found to have 75,960 indecent and explicit images on his computer and police found evidence he supplied at least 11,491 images to other paedophiles over the chatroom, on which he used the identity Son of God. He admitted to nine counts of possessing or distributing images of children. June 18, 2007","U.K. National Portrait Gallery threatens U.S. citizen with legal action over Wikimedia images. David Gerard, former Press Officer for Wikimedia UK, the U.K. chapter of the Wikimedia Foundation, which has been involved with the Wikipedia Loves Art contest to create free content photographs of exhibits at the Victoria and Albert Museum, stated on Slashdot that The NPG actually acknowledges in their letter that the poster's actions were entirely legal in America, and that they're making a threat just because they think they can. July 11, 2009",none,none,7.424087,-0.551083,0.339289,-0.402031,-0.980441,-1.001666,-1.054547,-0.743944,-1.918306,-0.571446,-0.710604,0.308223
5,"Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005","France knew of and told CIA about al-Qaeda hijack plans prior to 9/11. You have to remember that a plane hijack (in January 2001) did not have the same significance as it did after September 11. April 17, 2007",none,none,7.593912,-0.876651,0.6356,-0.518531,-0.812876,-1.278055,-1.096733,-0.992503,-2.099096,-0.853406,-1.054683,0.525095
6,"France knew of and told CIA about al-Qaeda hijack plans prior to 9/11. You have to remember that a plane hijack (in January 2001) did not have the same significance as it did after September 11. April 17, 2007","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,7.753581,-1.221486,1.300142,-0.623451,-0.753546,-1.500157,-1.126979,-1.017009,-1.912117,-0.800534,-1.315854,0.056387
7,"South Korean police clamp down on protests against US beef. He was forced to publicly apologize, and all but one of his top advisers were fired. June 30, 2008","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,7.159854,-0.527087,0.443114,-0.346904,-0.875457,-0.975675,-1.044084,-0.690082,-1.838717,-0.475215,-0.718884,0.194263
8,"15 Royal Navy sailors captured at gunpoint by Iranian guards. On that occasion the men were later released unharmed, but only after being paraded blindfolded on Iranian TV and made to apologise for their role in the incident. March 23, 2007","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,6.546415,-1.414657,2.130721,-0.931668,-0.234204,-1.52986,-0.628423,-1.291947,-1.831004,-1.304603,-1.703851,-0.053261
9,"China sentences six more to death over riots. An employee at the Xinjiang government's news center, who did not give her name, said that the sentencing was not over. October 12, 2009","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,7.637931,-1.251903,1.339247,-0.632884,-0.651235,-1.481616,-1.032817,-1.07315,-1.828598,-0.853998,-1.381876,-0.115074


#### Fails

In [22]:
example_prediction_output(prediction_output, test_origin, test_target, test_labels, False)

Unnamed: 0,Origin,Target,Label,Prediction,Pred_none,Pred_attribution,Pred_causal,Pred_conditional,Pred_contrast,Pred_description,Pred_equivalence,Pred_fulfillment,Pred_identity,Pred_purpose,Pred_summary,Pred_temporal
25,"Fatah assaults European Union office. 'This article has been archived as published, however, the gunmen, according to sources listed, were members of the Al Aqsa Martyrs' Brigades.' In a reaction to the ongoing controversy over the September publication of cartoons by the Danish newspaper Jyllands-Posten, gunmen from the Fatah assaulted a European Union (EU) office in the Gaza Strip on Monday, prompting Denmark to warn citizens to avoid travel to Saudi Arabia. January 27, 2006","New Zealand newspapers publish ""Mohammad Cartoons"". Two New Zealand newspapers, Fairfax-owned The Dominion Post and The Christchurch Press, today controversially published all 12 cartoons of the Prophet Mohammad, which have triggered international outrage. February 4, 2006",causal,none,-0.875474,-1.500314,1.978083,-0.978482,0.898743,-1.094446,1.575956,-1.153589,-0.140207,-1.223209,-1.754261,-0.816238
26,"New Zealand newspapers publish ""Mohammad Cartoons"". Two New Zealand newspapers, Fairfax-owned The Dominion Post and The Christchurch Press, today controversially published all 12 cartoons of the Prophet Mohammad, which have triggered international outrage. February 4, 2006","Fatah assaults European Union office. 'This article has been archived as published, however, the gunmen, according to sources listed, were members of the Al Aqsa Martyrs' Brigades.' In a reaction to the ongoing controversy over the September publication of cartoons by the Danish newspaper Jyllands-Posten, gunmen from the Fatah assaulted a European Union (EU) office in the Gaza Strip on Monday, prompting Denmark to warn citizens to avoid travel to Saudi Arabia. January 27, 2006",causal,none,-0.681203,-1.55325,2.171267,-0.872714,0.871357,-1.024705,1.64816,-1.05706,-0.299367,-1.301426,-1.839841,-0.661958
37,"Protests erupt in Pakistan over US air strike. Many Pakistanis took to the streets Saturday to demonstrate against the U.S. air strike of a village on the border of Afghanistan. January 14, 2006","At least 40 killed by bombing in Pakistan. The attack took place on the outskirts of Dara Adamkhel, a town which is close to the border with Afghanistan. March 2, 2008",causal,none,-1.815199,-1.472281,1.408857,-0.599616,0.705016,-0.678495,1.460095,-0.932614,-0.04045,-1.209824,-1.493517,0.211566
38,"At least 40 killed by bombing in Pakistan. The attack took place on the outskirts of Dara Adamkhel, a town which is close to the border with Afghanistan. March 2, 2008","Protests erupt in Pakistan over US air strike. Many Pakistanis took to the streets Saturday to demonstrate against the U.S. air strike of a village on the border of Afghanistan. January 14, 2006",causal,none,-0.386256,-1.546684,2.277749,-0.919457,0.997434,-1.010176,1.454126,-1.063916,-0.32105,-1.160465,-1.814899,-0.998759
54,"British Prime Minister Tony Blair suffers defeat in vote on terror laws. Opponents believe that by effectively giving the government the right to imprison for up to three months anyone who it alleged to have been involved in terrorism, without having to present any charges in court to justify the detention, the bill could have led to abuses of power. November 09, 2005","Documents allege U.S. Army kidnapped wives of enemy fighters. All of the released women had been accused of aiding terrorists or planting explosives, but an Iraqi government commission found there was insufficient evidence to continue holding them. January 28,2006",causal,none,-0.464692,-1.560784,2.302031,-0.969854,0.977077,-1.15442,1.414792,-1.136056,-0.351048,-1.312699,-1.828428,-0.858122
61,"Bomb blast kills 5 policemen in Islamabad, Pakistan. At least five policemen are dead after a bombing took place near the Islamabad, Pakistan. April 3, 2009","Seven policemen killed in Afghanistan after bomb explosion. At least seven policemen were killed in northeastern Afghanistan yesterday, according to reports, after a bomb went off near a police patrol vehicle. May 30, 2010",temporal,none,-0.202937,-1.120079,-0.164407,-0.360874,-0.696576,-0.634225,-0.551874,-0.848262,-1.093187,-1.093364,-1.203759,4.727787
62,"Ash-triggered flight disruptions cost airlines $1.7 billion. Restrictions over air travel in Europe have been lifted in many parts of the continent today; three-quarters of the scheduled flights were operating, and most of the European airspace having been opened. April 21, 2010","European airlines question flight bans. Some of Europe's airlines and airports have called into question whether the mass restrictions imposed on the continent's airspace, due to volcanic ash in the area, are necessary. April 17, 2010",causal,none,-3.470907,-0.757195,0.741208,-0.041966,1.200055,0.558963,1.652775,0.082559,1.07521,-0.429375,-0.68053,-0.905646
63,"European airlines question flight bans. Some of Europe's airlines and airports have called into question whether the mass restrictions imposed on the continent's airspace, due to volcanic ash in the area, are necessary. April 17, 2010","Ash-triggered flight disruptions cost airlines $1.7 billion. Restrictions over air travel in Europe have been lifted in many parts of the continent today; three-quarters of the scheduled flights were operating, and most of the European airspace having been opened. April 21, 2010",fulfillment,none,-3.781847,-0.666029,0.596304,0.117807,1.132663,0.606452,1.543783,0.109953,1.094619,-0.325294,-0.571536,-0.672498
68,"New videotape of Ayman al-Zawahiri aired on Aljazeera. During the broadcast, al-Zawahiri talks to the general Muslim population saying, I call upon them to reject any referendum on Palestine, because Palestine is not for bargaining or bidding. 2020-07-31T06:14:36Z","Muslim opens first Arab Holocaust museum in Nazareth. Mahameed is not without his critics, not only among Arabs who say that Mahameed should do more to draw attention to the situation of present-day Palestinians, but also representatives of the Israel office of the Jewish Anti-Defamation League (ADL), who have stated without visiting the museum that they consider some of the attitudes expressed on Mahameed's website to be anti-Semitic. May 6, 2005",causal,none,-0.285192,-1.675672,2.516045,-0.865789,0.928935,-1.140686,1.401313,-1.085238,-0.531101,-1.358472,-1.976486,-0.52707
106,"Documents allege U.S. Army kidnapped wives of enemy fighters. All of the released women had been accused of aiding terrorists or planting explosives, but an Iraqi government commission found there was insufficient evidence to continue holding them. January 28,2006","British Prime Minister Tony Blair suffers defeat in vote on terror laws. Opponents believe that by effectively giving the government the right to imprison for up to three months anyone who it alleged to have been involved in terrorism, without having to present any charges in court to justify the detention, the bill could have led to abuses of power. November 09, 2005",causal,none,-0.045373,-1.5903,2.545204,-0.976182,0.93,-1.170197,1.304607,-1.138442,-0.498146,-1.314314,-1.893509,-0.974941


### Prediction output

In [23]:
def format_prediction_output(result, origin_list, target_list, label_list):
    global labels
    # Real Relation
    data = []
    for n in range(len(origin_list)):
        data.append([origin_list[n], target_list[n], labels[label_list[n]]])
    df_real = pd.DataFrame(data, columns=['Origin', 'Target', 'Label'])
    # Predicted Label
    label_data = []
    for n in result.label_ids:
        i = np.argmax(result.predictions[n], axis=-1)
        label_data.append([labels[i]])
    df_pred_labels = pd.DataFrame(label_data, columns=["Prediction"])
    # Prediction Metrics
    df_predictions = pd.DataFrame(result.predictions, columns=labels)
    df_predictions = df_predictions.add_prefix("Pred_")
    df = pd.concat([df_real, df_pred_labels, df_predictions], axis=1)
    display(HTML(df.to_html()))
    
format_prediction_output(prediction_output, test_origin, test_target, test_labels)

Unnamed: 0,Origin,Target,Label,Prediction,Pred_none,Pred_attribution,Pred_causal,Pred_conditional,Pred_contrast,Pred_description,Pred_equivalence,Pred_fulfillment,Pred_identity,Pred_purpose,Pred_summary,Pred_temporal
0,"Canada confirms fifth case of Mad Cow Disease. This is Canada's fifth confirmed case of the disease since May 2003, and officials have tested more than 100,000 cows since the first case of the disease turned up in Alberta. April 14, 2006","Swine flu: recent developments worldwide. A majority of the cases were reported by the United States, which now has at least 10,053 confirmed infections from the disease. May 19, 2009",none,none,6.796221,-0.310706,-0.037133,-0.411199,-1.136399,-0.951643,-1.08762,-0.564183,-1.804138,-0.369897,-0.601369,0.821839
1,"Swine flu: recent developments worldwide. A majority of the cases were reported by the United States, which now has at least 10,053 confirmed infections from the disease. May 19, 2009","Canada confirms fifth case of Mad Cow Disease. This is Canada's fifth confirmed case of the disease since May 2003, and officials have tested more than 100,000 cows since the first case of the disease turned up in Alberta. April 14, 2006",none,none,6.937126,-0.426267,0.189443,-0.461942,-1.04427,-0.933352,-0.989166,-0.558361,-1.735762,-0.455372,-0.602375,0.421047
2,"U.K. National Portrait Gallery threatens U.S. citizen with legal action over Wikimedia images. David Gerard, former Press Officer for Wikimedia UK, the U.K. chapter of the Wikimedia Foundation, which has been involved with the Wikipedia Loves Art contest to create free content photographs of exhibits at the Victoria and Albert Museum, stated on Slashdot that The NPG actually acknowledges in their letter that the poster's actions were entirely legal in America, and that they're making a threat just because they think they can. July 11, 2009","Church of Scientology attempting to block 'intolerant' German film. Carl Bergengruen, the head of TV movies for Südwestrundfunk (SWR or Southwest Broadcasting), the public broadcaster backing the project defended their secrecy practices saying, Scientology kept trying to use a variety of methods to find out details about the project. March 15, 2010",none,none,7.684356,-0.934911,0.937986,-0.539007,-0.814859,-1.310764,-0.9842,-0.9214,-1.907234,-0.786805,-1.076709,-0.094654
3,"Church of Scientology attempting to block 'intolerant' German film. Carl Bergengruen, the head of TV movies for Südwestrundfunk (SWR or Southwest Broadcasting), the public broadcaster backing the project defended their secrecy practices saying, Scientology kept trying to use a variety of methods to find out details about the project. March 15, 2010","U.K. National Portrait Gallery threatens U.S. citizen with legal action over Wikimedia images. David Gerard, former Press Officer for Wikimedia UK, the U.K. chapter of the Wikimedia Foundation, which has been involved with the Wikipedia Loves Art contest to create free content photographs of exhibits at the Victoria and Albert Museum, stated on Slashdot that The NPG actually acknowledges in their letter that the poster's actions were entirely legal in America, and that they're making a threat just because they think they can. July 11, 2009",none,none,7.430922,-0.593533,0.461762,-0.423344,-0.868214,-1.037013,-0.982202,-0.813418,-1.888756,-0.603058,-0.726541,0.050769
4,"31 children rescued as UK police shut down global paedophile ring. Cox himself was found to have 75,960 indecent and explicit images on his computer and police found evidence he supplied at least 11,491 images to other paedophiles over the chatroom, on which he used the identity Son of God. He admitted to nine counts of possessing or distributing images of children. June 18, 2007","U.K. National Portrait Gallery threatens U.S. citizen with legal action over Wikimedia images. David Gerard, former Press Officer for Wikimedia UK, the U.K. chapter of the Wikimedia Foundation, which has been involved with the Wikipedia Loves Art contest to create free content photographs of exhibits at the Victoria and Albert Museum, stated on Slashdot that The NPG actually acknowledges in their letter that the poster's actions were entirely legal in America, and that they're making a threat just because they think they can. July 11, 2009",none,none,7.424087,-0.551083,0.339289,-0.402031,-0.980441,-1.001666,-1.054547,-0.743944,-1.918306,-0.571446,-0.710604,0.308223
5,"Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005","France knew of and told CIA about al-Qaeda hijack plans prior to 9/11. You have to remember that a plane hijack (in January 2001) did not have the same significance as it did after September 11. April 17, 2007",none,none,7.593912,-0.876651,0.6356,-0.518531,-0.812876,-1.278055,-1.096733,-0.992503,-2.099096,-0.853406,-1.054683,0.525095
6,"France knew of and told CIA about al-Qaeda hijack plans prior to 9/11. You have to remember that a plane hijack (in January 2001) did not have the same significance as it did after September 11. April 17, 2007","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,7.753581,-1.221486,1.300142,-0.623451,-0.753546,-1.500157,-1.126979,-1.017009,-1.912117,-0.800534,-1.315854,0.056387
7,"South Korean police clamp down on protests against US beef. He was forced to publicly apologize, and all but one of his top advisers were fired. June 30, 2008","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,7.159854,-0.527087,0.443114,-0.346904,-0.875457,-0.975675,-1.044084,-0.690082,-1.838717,-0.475215,-0.718884,0.194263
8,"15 Royal Navy sailors captured at gunpoint by Iranian guards. On that occasion the men were later released unharmed, but only after being paraded blindfolded on Iranian TV and made to apologise for their role in the incident. March 23, 2007","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,6.546415,-1.414657,2.130721,-0.931668,-0.234204,-1.52986,-0.628423,-1.291947,-1.831004,-1.304603,-1.703851,-0.053261
9,"China sentences six more to death over riots. An employee at the Xinjiang government's news center, who did not give her name, said that the sentencing was not over. October 12, 2009","Bush speaks of goals for U.S. withdrawal from Iraq, decries calls for timetable. A day before the president's address, Sen. Hillary Clinton, in an E-mail to her supporters had said Given years of assurances that the war was nearly over and that the insurgents were in their 'last throes,' this administration was either not being honest with the American people or did not know what was going on in Iraq. November 30 2005",none,none,7.637931,-1.251903,1.339247,-0.632884,-0.651235,-1.481616,-1.032817,-1.07315,-1.828598,-0.853998,-1.381876,-0.115074
