In [1]:
import json
import os

#### Read Dataset

In [2]:
# Load the two XSum annotation files (factuality judgements and hallucinated
# spans). Each is opened in a context manager so the file handle is closed
# deterministically instead of being left to the garbage collector.
with open('../data/xsum_hallucination_annotations/factuality_annotations_xsum_summaries.json') as factuality_file:
    factuality_data = json.load(factuality_file)
with open('../data/xsum_hallucination_annotations/hallucination_annotations_xsum_summaries.json') as hallucination_file:
    hallucination_data = json.load(hallucination_file)

In [3]:
# Report the number of records in each annotation list, one count per line
# (factuality first, then hallucination).
print(len(factuality_data), len(hallucination_data), sep='\n')

5597
11185


In [4]:
# Distinct values of the 'system' field across the factuality annotations.
{annotation['system'] for annotation in factuality_data}

{'BERTS2S', 'PtGen', 'TConvS2S', 'TranS2S'}

In [5]:
# Peek at the first factuality record to see which fields an annotation carries.
factuality_data[0]

{'bbcid': 29911712,
 'system': 'BERTS2S',
 'summary': 'more than 50 pupils at a bristol academy have been sent home from school because of a lack of uniform.',
 'is_factual': 'no',
 'worker_id': 'wid_0'}

In [6]:
# Peek at the first hallucination record to see which fields an annotation carries.
hallucination_data[0]

{'bbcid': 34687720,
 'system': 'BERTS2S',
 'summary': 'rory mcilroy will take a one-shot lead into the final round of the wgc-hsbc champions after carding a three-under',
 'hallucination_type': 'extrinsic',
 'hallucinated_span': 'rory mcilroy will take a one-shot lead into the final round of the wgc-hsbc champions after carding a three-under',
 'worker_id': 'wid_0'}

#### Read Calculated Probabilities

In [7]:
# Load the entity-level data with pre-computed model probabilities. The
# context manager closes the file handle as soon as parsing is done.
with open('../data/Maynez_entity_data_with_prob.json', 'r') as proba_file:
    google_data_with_proba = json.load(proba_file)

In [8]:
# Number of top-level entries in the probability file (it is indexed by
# bbcid strings elsewhere in this notebook).
print(len(google_data_with_proba))

500


In [9]:
# Inspect the BERTS2S entry of one article: the summary text plus a list of
# entity records under 'ents'.
google_data_with_proba['34687720']['BERTS2S']

{'summary': 'rory mcilroy will take a one-shot lead into the final round of the wgc-hsbc champions after carding a three-under',
 'summary_upper': 'Rory McIlroy will take a one-shot lead into the final round of the Wgc-Hsbc champions after carding a Three-Under',
 'ents': [{'start': 0,
   'end': 4,
   'label': 2,
   'type': 'PERSON',
   'ent': 'Rory',
   'bart.large': 0.379150390625,
   'xsum_cmlm_bos': 0.923828125,
   'cnndm_cmlm_cedar': 0.1370849609375,
   'bart.large.xsum': 0.6513671875},
  {'start': 5,
   'end': 12,
   'label': 2,
   'type': 'PERSON',
   'ent': 'McIlroy',
   'bart.large': 0.97119140625,
   'xsum_cmlm_bos': 0.7802734375,
   'cnndm_cmlm_cedar': 0.82861328125,
   'bart.large.xsum': 0.80712890625},
  {'start': 25,
   'end': 28,
   'label': 2,
   'type': 'CARDINAL',
   'ent': 'one',
   'bart.large': 0.004116058349609375,
   'xsum_cmlm_bos': 0.1072998046875,
   'cnndm_cmlm_cedar': 0.423095703125,
   'bart.large.xsum': 0.400146484375},
  {'start': 63,
   'end': 75,
   'la

#### Labeling

In [10]:
import copy
import random

In [11]:
from utils import read_document

In [14]:
# Draw a random article id. random.sample() requires a sequence: passing a
# dict key view was deprecated in Python 3.9 and raises TypeError from 3.11,
# so the keys are materialised into a list first.
bbcid = random.sample(list(google_data_with_proba), 1)[0]
# Pin the article under inspection; comment this line out to use the random
# draw above instead.
bbcid = '34687720'
print(bbcid)

34687720


In [15]:
# List the second-level keys available for the selected article.
google_data_with_proba[bbcid].keys()

dict_keys(['BERTS2S', 'TConvS2S', 'Gold', 'PtGen', 'TranS2S'])

In [16]:
# Display the complete entry for the selected article.
# NOTE(review): this dumps the whole nested dict into the cell output.
google_data_with_proba[bbcid]

{'BERTS2S': {'summary': 'rory mcilroy will take a one-shot lead into the final round of the wgc-hsbc champions after carding a three-under',
  'summary_upper': 'Rory McIlroy will take a one-shot lead into the final round of the Wgc-Hsbc champions after carding a Three-Under',
  'ents': [{'start': 0,
    'end': 4,
    'label': 2,
    'type': 'PERSON',
    'ent': 'Rory',
    'bart.large': 0.379150390625,
    'xsum_cmlm_bos': 0.923828125,
    'cnndm_cmlm_cedar': 0.1370849609375,
    'bart.large.xsum': 0.6513671875},
   {'start': 5,
    'end': 12,
    'label': 2,
    'type': 'PERSON',
    'ent': 'McIlroy',
    'bart.large': 0.97119140625,
    'xsum_cmlm_bos': 0.7802734375,
    'cnndm_cmlm_cedar': 0.82861328125,
    'bart.large.xsum': 0.80712890625},
   {'start': 25,
    'end': 28,
    'label': 2,
    'type': 'CARDINAL',
    'ent': 'one',
    'bart.large': 0.004116058349609375,
    'xsum_cmlm_bos': 0.1072998046875,
    'cnndm_cmlm_cedar': 0.423095703125,
    'bart.large.xsum': 0.40014648437

In [17]:
# Directory holding the preprocessed XSum source documents. The original
# cluster path remains the default, but it can be overridden through the
# XSUM_DOCUMENT_DIR environment variable so the notebook also runs on other
# machines. os.path.join(path, '') appends a trailing separator when it is
# missing, matching the form of the default path.
# NOTE(review): read_document may rely on that trailing separator — confirm.
document_dir = os.path.join(
    os.environ.get('XSUM_DOCUMENT_DIR')
    or '/home/mcao610/scratch/summarization/XSum/xsum-preprocessed/document/',
    '',
)
# read_document is imported from the project-local utils module; the article
# id is passed as an int.
document = read_document(int(bbcid), document_dir)

# Print the 'Gold' summary (cased variant), a blank line, then the document.
print(google_data_with_proba[bbcid]['Gold']['summary_upper'], end='\n\n')
print(document)

Rory McIlroy moved to within a shot of joint leaders Victor Dubuisson and Jaco van Zyl after the third round of the Turkish Airlines open .

France 's Dubuisson carded a 67 to tie with overnight leader Van Zyl of South Africa on 16 under par . McIlroy carded a third straight five under - par 67 to move to 15 under par with Thailand 's Kiradech Aphibarnrat . The world number three 's round included an eagle on the 12th as he bids to win his first title since May . " The 67s I 've shot this week have all been a little different and I feel like I 've played within myself for all of them , " said four - time major winner McIlroy of Northern Ireland . " I feel there 's a low round out there for me and hopefully it 's tomorrow . " McIlroy was level par for the day after 10 holes , dropping his first shots of the week by three - putting the third and 10th , the latter mistake prompting the 26 - year - old to throw his putter at his bag . But he hit back with a birdie on the par - five 11th an

In [18]:
# Container for the labeled entries assigned below, keyed by bbcid string.
# Each value maps a system name (or 'Gold') to a dict with 'summary',
# 'summary_upper' and 'ents', the same layout as google_data_with_proba entries.
# NOTE(review): the meaning of the integer 'label' codes used in the entries
# below (-1, 0, 1, 2, 3) is not documented in this notebook — confirm.
labeled_maynez = {}

labeled_maynez['32584708'] = {'BERTS2S': {'summary': "italy's lower house of parliament has passed a controversial parliamentary reform of the country's electoral system.",
  'summary_upper': "Italy 's lower house of parliament has passed a controversial parliamentary reform of the country 's electoral system .",
  'ents': [{'start': 0,
    'end': 5,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.00510406494140625,
    'xsum_cmlm_bos': 0.9208984375,
    'cnndm_cmlm_cedar': 0.90283203125,
    'bart.large.xsum': 0.5498046875}]},
 'TConvS2S': {'summary': "italy's lower house of parliament has voted to end the process of reducing the country's power system.",
  'summary_upper': "Italy 's lower house of parliament has voted to end the process of reducing the country 's power system .",
  'ents': [{'start': 0,
    'end': 5,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.0022430419921875,
    'xsum_cmlm_bos': 0.91357421875,
    'cnndm_cmlm_cedar': 0.8984375,
    'bart.large.xsum': 0.5498046875}]},
 'Gold': {'summary': 'the italian parliament has approved a long-debated and extensive electoral reform that aims to give the country more political stability.',
  'summary_upper': 'The Italian parliament has approved a long-debated and extensive electoral reform that aims to give the country more political stability .',
  'ents': [{'start': 4,
    'end': 11,
    'label': 0,
    'type': 'NORP',
    'ent': 'Italian',
    'bart.large': 0.0017480850219726562,
    'xsum_cmlm_bos': 0.92529296875,
    'cnndm_cmlm_cedar': 0.93701171875,
    'bart.large.xsum': 0.8994140625}]},
 'PtGen': {'summary': 'voters in italy have voted overwhelmingly to elect a new president in the wake of the italian election system.',
  'summary_upper': 'Voters in Italy have voted overwhelmingly to elect a new president in the wake of the Italian election system .',
  'ents': [{'start': 10,
    'end': 15,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.036529541015625,
    'xsum_cmlm_bos': 0.9013671875,
    'cnndm_cmlm_cedar': 0.88623046875,
    'bart.large.xsum': 0.8388671875},
   {'start': 86,
    'end': 93,
    'label': 2,
    'type': 'NORP',
    'ent': 'Italian',
    'bart.large': 0.005596160888671875,
    'xsum_cmlm_bos': 0.0035915374755859375,
    'cnndm_cmlm_cedar': 0.00798797607421875,
    'bart.large.xsum': 0.007762908935546875}]},
 'TranS2S': {'summary': "italian prime minister matteo renzi has won the latest stage in a vote in italy's parliament.",
  'summary_upper': "Italian prime minister Matteo Renzi has won the latest stage in a vote in Italy 's parliament .",
  'ents': [{'start': 0,
    'end': 7,
    'label': 0,
    'type': 'NORP',
    'ent': 'Italian',
    'bart.large': 0.10858154296875,
    'xsum_cmlm_bos': 0.8994140625,
    'cnndm_cmlm_cedar': 0.94384765625,
    'bart.large.xsum': 0.0740966796875},
   {'start': 23,
    'end': 29,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Matteo',
    'bart.large': 0.045196533203125,
    'xsum_cmlm_bos': 0.89306640625,
    'cnndm_cmlm_cedar': 0.90380859375,
    'bart.large.xsum': 0.7763671875},
   {'start': 30,
    'end': 35,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Renzi',
    'bart.large': 0.9130859375,
    'xsum_cmlm_bos': 0.8330078125,
    'cnndm_cmlm_cedar': 0.8359375,
    'bart.large.xsum': 0.79833984375},
   {'start': 74,
    'end': 79,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.1138916015625,
    'xsum_cmlm_bos': 0.2105712890625,
    'cnndm_cmlm_cedar': 0.69091796875,
    'bart.large.xsum': 0.0021991729736328125}]}}


labeled_maynez['38450424'] = {
  'BERTS2S': {'summary': "israel's decision to abstain from developing jewish settlements in the occupied west bank has been called off.",
  'summary_upper': "Israel 's decision to abstain from developing Jewish settlements in the occupied West Bank has been called off .",
  'ents': [{'start': 0,
    'end': 6,
    'label': 0,
    'type': 'GPE',
    'ent': 'Israel',
    'bart.large': 0.12548828125,
    'xsum_cmlm_bos': 0.92626953125,
    'cnndm_cmlm_cedar': 0.89697265625,
    'bart.large.xsum': 0.54736328125},
   {'start': 46,
    'end': 52,
    'label': 0,
    'type': 'NORP',
    'ent': 'Jewish',
    'bart.large': 0.00104522705078125,
    'xsum_cmlm_bos': 0.95068359375,
    'cnndm_cmlm_cedar': 0.000911712646484375,
    'bart.large.xsum': 0.0028972625732421875},
   {'start': 81,
    'end': 90,
    'label': 0,
    'type': 'GPE',
    'ent': 'West Bank',
    'bart.large': 0.6640625,
    'xsum_cmlm_bos': 0.83837890625,
    'cnndm_cmlm_cedar': 0.19921875,
    'bart.large.xsum': 0.83251953125}]},
 'TConvS2S': {'summary': 'israeli prime minister benjamin netanyahu has said it is deeply disappointed" that israel\'s new prime minister',
  'summary_upper': "Israeli Prime Minister Benjamin Netanyahu has said it is deeply disappointed '' that Israel 's new prime minister",
  'ents': [{'start': 0,
    'end': 7,
    'label': 0,
    'type': 'NORP',
    'ent': 'Israeli',
    'bart.large': 0.0229949951171875,
    'xsum_cmlm_bos': 0.904296875,
    'cnndm_cmlm_cedar': 0.89453125,
    'bart.large.xsum': 0.038665771484375},
   {'start': 23,
    'end': 31,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Benjamin',
    'bart.large': 0.89697265625,
    'xsum_cmlm_bos': 0.9404296875,
    'cnndm_cmlm_cedar': 0.94677734375,
    'bart.large.xsum': 0.9208984375},
   {'start': 32,
    'end': 41,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Netanyahu',
    'bart.large': 0.9892578125,
    'xsum_cmlm_bos': 0.92529296875,
    'cnndm_cmlm_cedar': 0.93212890625,
    'bart.large.xsum': 0.8740234375},
   {'start': 85,
    'end': 91,
    'label': 0,
    'type': 'GPE',
    'ent': 'Israel',
    'bart.large': 0.0196685791015625,
    'xsum_cmlm_bos': 0.044769287109375,
    'cnndm_cmlm_cedar': 0.001491546630859375,
    'bart.large.xsum': 0.01219940185546875}]},
 'Gold': {'summary': 'an israeli committee has postponed a vote to authorise construction of almost 500 new homes in jewish settlements in occupied east jerusalem.',
  'summary_upper': 'An Israeli committee has postponed a vote to authorise construction of almost 500 new homes in Jewish settlements in occupied East Jerusalem .',
  'ents': [{'start': 3,
    'end': 10,
    'label': 0,
    'type': 'NORP',
    'ent': 'Israeli',
    'bart.large': 0.94580078125,
    'xsum_cmlm_bos': 0.84375,
    'cnndm_cmlm_cedar': 0.85888671875,
    'bart.large.xsum': 0.861328125},
   {'start': 71,
    'end': 81,
    'label': 1,
    'type': 'CARDINAL',
    'ent': 'almost 500',
    'bart.large': 0.00024580955505371094,
    'xsum_cmlm_bos': 0.04046630859375,
    'cnndm_cmlm_cedar': 2.294778823852539e-05,
    'bart.large.xsum': 0.031005859375},
   {'start': 95,
    'end': 101,
    'label': 0,
    'type': 'NORP',
    'ent': 'Jewish',
    'bart.large': 0.035552978515625,
    'xsum_cmlm_bos': 0.0161590576171875,
    'cnndm_cmlm_cedar': 3.9696693420410156e-05,
    'bart.large.xsum': 0.095458984375},
   {'start': 126,
    'end': 140,
    'label': 0,
    'type': 'GPE',
    'ent': 'East Jerusalem',
    'bart.large': 0.595703125,
    'xsum_cmlm_bos': 0.400634765625,
    'cnndm_cmlm_cedar': 0.39697265625,
    'bart.large.xsum': 0.52734375}]},
 'PtGen': {'summary': "israel's security council has rejected a proposal by the us government to press ahead with a resolution calling for an end to the construction of a two-state solution.",
  'summary_upper': "Israel 's Security Council has rejected a proposal by the US government to press ahead with a resolution calling for an end to the construction of a two-state solution .",
  'ents': [{'start': 0,
    'end': 6,
    'label': 0,
    'type': 'GPE',
    'ent': 'Israel',
    'bart.large': 0.04107666015625,
    'xsum_cmlm_bos': 0.8671875,
    'cnndm_cmlm_cedar': 0.89453125,
    'bart.large.xsum': 0.54638671875},
   {'start': 10,
    'end': 26,
    'label': 3,
    'type': 'ORG',
    'ent': 'Security Council',
    'bart.large': 0.004177093505859375,
    'xsum_cmlm_bos': 0.07257080078125,
    'cnndm_cmlm_cedar': 0.77587890625,
    'bart.large.xsum': 5.984306335449219e-05},
   {'start': 58,
    'end': 60,
    'label': 0,
    'type': 'GPE',
    'ent': 'US',
    'bart.large': 0.227294921875,
    'xsum_cmlm_bos': 0.0035381317138671875,
    'cnndm_cmlm_cedar': 0.001178741455078125,
    'bart.large.xsum': 0.00237274169921875},
   {'start': 149,
    'end': 152,
    'label': 0,
    'type': 'CARDINAL',
    'ent': 'two',
    'bart.large': 0.157958984375,
    'xsum_cmlm_bos': 0.8876953125,
    'cnndm_cmlm_cedar': 0.91357421875,
    'bart.large.xsum': 0.00018787384033203125}]},
 'TranS2S': {'summary': "the us has vetoed a un resolution against israel's prime minister benjamin netanyahu, accusing him of violating a un security law.",
  'summary_upper': "The US has vetoed a UN resolution against Israel 's prime minister Benjamin Netanyahu , accusing him of violating a UN Security law .",
  'ents': [{'start': 4,
    'end': 6,
    'label': 0,
    'type': 'GPE',
    'ent': 'US',
    'bart.large': 0.454345703125,
    'xsum_cmlm_bos': 0.892578125,
    'cnndm_cmlm_cedar': 0.7841796875,
    'bart.large.xsum': 0.0753173828125},
   {'start': 20,
    'end': 22,
    'label': 0,
    'type': 'ORG',
    'ent': 'UN',
    'bart.large': 0.358154296875,
    'xsum_cmlm_bos': 0.58837890625,
    'cnndm_cmlm_cedar': 0.4140625,
    'bart.large.xsum': 0.23681640625},
   {'start': 42,
    'end': 48,
    'label': 0,
    'type': 'GPE',
    'ent': 'Israel',
    'bart.large': 0.343994140625,
    'xsum_cmlm_bos': 0.91943359375,
    'cnndm_cmlm_cedar': 0.90869140625,
    'bart.large.xsum': 0.02947998046875},
   {'start': 67,
    'end': 75,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Benjamin',
    'bart.large': 0.78125,
    'xsum_cmlm_bos': 0.94287109375,
    'cnndm_cmlm_cedar': 0.9443359375,
    'bart.large.xsum': 0.0003254413604736328},
   {'start': 76,
    'end': 85,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Netanyahu',
    'bart.large': 0.99755859375,
    'xsum_cmlm_bos': 0.93359375,
    'cnndm_cmlm_cedar': 0.94287109375,
    'bart.large.xsum': 0.923828125},
   {'start': 116,
    'end': 127,
    'label': 0,
    'type': 'ORG',
    'ent': 'UN Security',
    'bart.large': 0.01568603515625,
    'xsum_cmlm_bos': 1.2516975402832031e-06,
    'cnndm_cmlm_cedar': 8.344650268554688e-06,
    'bart.large.xsum': 0.0264434814453125}]}}

labeled_maynez['27775709'] = {
  'BERTS2S': {'summary': 'three schools have been threatened with legal action over an alleged trojan horse affair, the education secretary has said.',
  'summary_upper': 'Three schools have been threatened with legal action over an alleged Trojan horse affair , the education secretary has said .',
  'ents': [{'start': 0,
    'end': 5,
    'label': 3,
    'type': 'CARDINAL',
    'ent': 'Three',
    'bart.large': 0.0101776123046875,
    'xsum_cmlm_bos': 0.8935546875,
    'cnndm_cmlm_cedar': 0.308349609375,
    'bart.large.xsum': 0.48681640625},
   {'start': 69,
    'end': 75,
    'label': 0,
    'type': 'ORG',
    'ent': 'Trojan',
    'bart.large': 0.000186920166015625,
    'xsum_cmlm_bos': 0.98974609375,
    'cnndm_cmlm_cedar': 0.9833984375,
    'bart.large.xsum': 0.458740234375}]},
 'TConvS2S': {'summary': 'the head teacher of a birmingham school has been placed in special measures after being found guilty of misconduct.',
  'summary_upper': 'The head teacher of a Birmingham school has been placed in special measures after being found guilty of misconduct .',
  'ents': [{'start': 22,
    'end': 32,
    'label': 0,
    'type': 'GPE',
    'ent': 'Birmingham',
    'bart.large': 0.005329132080078125,
    'xsum_cmlm_bos': 0.0204315185546875,
    'cnndm_cmlm_cedar': 0.65478515625,
    'bart.large.xsum': 0.08184814453125}]},
 'Gold': {'summary': 'two schools at the centre of the trojan horse inquiry are to lose their government funding.',
  'summary_upper': 'Two schools at the centre of the Trojan horse inquiry are to lose their government funding .',
  'ents': [{'start': 0,
    'end': 3,
    'label': 0,
    'type': 'CARDINAL',
    'ent': 'Two',
    'bart.large': 0.0183868408203125,
    'xsum_cmlm_bos': 0.0183258056640625,
    'cnndm_cmlm_cedar': 0.2470703125,
    'bart.large.xsum': 0.09735107421875},
   {'start': 33,
    'end': 39,
    'label': 0,
    'type': 'GPE',
    'ent': 'Trojan',
    'bart.large': 0.0007348060607910156,
    'xsum_cmlm_bos': 0.962890625,
    'cnndm_cmlm_cedar': 0.95361328125,
    'bart.large.xsum': 0.5859375}]},
 'PtGen': {'summary': 'a primary school in birmingham has been rated "inadequate" by a senior ofsted inspector who has been rated "inadequate" by ofsted.',
  'summary_upper': "A primary school in Birmingham has been rated `` inadequate '' by a senior Ofsted inspector who has been rated `` inadequate '' by Ofsted .",
  'ents': [{'start': 20,
    'end': 30,
    'label': 0,
    'type': 'GPE',
    'ent': 'Birmingham',
    'bart.large': 0.00577545166015625,
    'xsum_cmlm_bos': 0.849609375,
    'cnndm_cmlm_cedar': 0.87939453125,
    'bart.large.xsum': 0.419921875},
   {'start': 75,
    'end': 81,
    'label': 0,
    'type': 'ORG',
    'ent': 'Ofsted',
    'bart.large': 0.1636962890625,
    'xsum_cmlm_bos': 0.85791015625,
    'cnndm_cmlm_cedar': 0.8701171875,
    'bart.large.xsum': 0.78466796875},
   {'start': 131,
    'end': 137,
    'label': 0,
    'type': 'ORG',
    'ent': 'Ofsted',
    'bart.large': 0.00249481201171875,
    'xsum_cmlm_bos': 0.0024166107177734375,
    'cnndm_cmlm_cedar': 0.791015625,
    'bart.large.xsum': 0.0511474609375}]},
 'TranS2S': {'summary': 'pupils at a school in birmingham have been told they will lose their jobs because of a lack of funding.',
  'summary_upper': 'Pupils at a school in Birmingham have been told they will lose their jobs because of a lack of funding .',
  'ents': [{'start': 22,
    'end': 32,
    'label': 0,
    'type': 'GPE',
    'ent': 'Birmingham',
    'bart.large': 0.0103759765625,
    'xsum_cmlm_bos': 0.85546875,
    'cnndm_cmlm_cedar': 0.90087890625,
    'bart.large.xsum': 0.64599609375}]}}

labeled_maynez['32219005'] = {'BERTS2S': {'summary': "children at the centre of a controversy over the treatment of baby ashya king's parents may have been denied treatment, say doctors.",
  'summary_upper': "Children at the centre of a controversy over the treatment of baby Ashya King 's parents may have been denied treatment , say doctors .",
  'ents': [{'start': 67,
    'end': 77,
    'label': 0,
    'type': 'ORG',
    'ent': "Ashya King",
    'bart.large': 0.0,
    'xsum_cmlm_bos': 0.66748046875,
    'cnndm_cmlm_cedar': 0.00015485286712646484,
    'bart.large.xsum': 0.5009765625}]},
 'TConvS2S': {'summary': 'brain tumour patient ashya king has been diagnosed with cancer, the bbc has learned.',
  'summary_upper': 'Brain tumour patient Ashya King has been diagnosed with cancer , the BBC has learned .',
  'ents': [{'start': 21,
    'end': 31,
    'label': 0,
    'type': 'ORG',
    'ent': 'Ashya King',
    'bart.large': 0.0,
    'xsum_cmlm_bos': 0.66748046875,
    'cnndm_cmlm_cedar': 0.0015926361083984375,
    'bart.large.xsum': 0.5009765625},
   {'start': 69,
    'end': 72,
    'label': 0,
    'type': 'ORG',
    'ent': 'BBC',
    'bart.large': 0.09735107421875,
    'xsum_cmlm_bos': 0.912109375,
    'cnndm_cmlm_cedar': 0.87060546875,
    'bart.large.xsum': 0.9208984375}]},
 'Gold': {'summary': 'doctors and nurses who treated cancer patient ashya king have criticised his parents while speaking out for the first time in a bbc documentary.',
  'summary_upper': 'Doctors and nurses who treated cancer patient Ashya King have criticised his parents while speaking out for the first time in a BBC documentary .',
  'ents': [{'start': 46,
    'end': 56,
    'label': 0,
    'type': 'ORG',
    'ent': 'Ashya King',
    'bart.large': 0.0,
    'xsum_cmlm_bos': 0.662109375,
    'cnndm_cmlm_cedar': 0.018280029296875,
    'bart.large.xsum': 0.52783203125},
   {'start': 112,
    'end': 117,
    'label': 1,
    'type': 'ORDINAL',
    'ent': 'first',
    'bart.large': 0.9873046875,
    'xsum_cmlm_bos': 0.89794921875,
    'cnndm_cmlm_cedar': 0.87744140625,
    'bart.large.xsum': 0.7685546875},
   {'start': 128,
    'end': 131,
    'label': 0,
    'type': 'ORG',
    'ent': 'BBC',
    'bart.large': 0.2305908203125,
    'xsum_cmlm_bos': 0.91552734375,
    'cnndm_cmlm_cedar': 0.92578125,
    'bart.large.xsum': 0.80224609375}]},
 'PtGen': {'summary': 'ashya king, whose parents were treated for cancer, has been cured for his treatment for treatment for cancer.',
  'summary_upper': 'Ashya King , whose parents were treated for cancer , has been cured for his treatment for treatment for cancer .',
  'ents': [{'start': 0,
    'end': 10,
    'label': 0,
    'type': 'ORG',
    'ent': 'Ashya King',
    'bart.large': 0.0,
    'xsum_cmlm_bos': 0.57958984375,
    'cnndm_cmlm_cedar': 0.0011310577392578125,
    'bart.large.xsum': 0.03192138671875}]},
 'TranS2S': {'summary': 'a terminally ill five-year-old ashya king suffered chemotherapy as a result of treatment for leukaemia, his family have said.',
  'summary_upper': 'A terminally ill five-year-old Ashya king suffered chemotherapy as a result of treatment for Leukaemia , his family have said .',
  'ents': [{'start': 17,
    'end': 30,
    'label': 0,
    'type': 'DATE',
    'ent': 'five-year-old',
    'bart.large': 0.0024089813232421875,
    'xsum_cmlm_bos': 0.0114593505859375,
    'cnndm_cmlm_cedar': 0.37841796875,
    'bart.large.xsum': 0.0090484619140625},
   {'start': 31,
    'end': 36,
    'label': 0,
    'type': 'PRODUCT',
    'ent': 'Ashya',
    'bart.large': 0.0,
    'xsum_cmlm_bos': 0.00022780895233154297,
    'cnndm_cmlm_cedar': 0.000766754150390625,
    'bart.large.xsum': 0.0016374588012695312},
   {'start': 93,
    'end': 102,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Leukaemia',
    'bart.large': 0.0005216598510742188,
    'xsum_cmlm_bos': 0.024505615234375,
    'cnndm_cmlm_cedar': 0.007293701171875,
    'bart.large.xsum': 0.00086212158203125}]}}

labeled_maynez['36457308'] = {'BERTS2S': {
  'summary': 'gianni giaccherini scored twice as italy beat belgium 2-0 to reach the last 16 of the european championship for the first time.',
  'summary_upper': 'Gianni Giaccherini scored twice as Italy beat Belgium 2-0 to reach the last 16 of the European championship for the first time .',
  'ents': [{'start': 7,
    'end': 18,
    'label': 0,
    'type': 'PERSON',
    'ent': 'Giaccherini',
    'bart.large': 0.00019919872283935547,
    'xsum_cmlm_bos': 0.48828125,
    'cnndm_cmlm_cedar': 0.03302001953125,
    'bart.large.xsum': 0.1951904296875},
   {'start': 35,
    'end': 40,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.544921875,
    'xsum_cmlm_bos': 0.8916015625,
    'cnndm_cmlm_cedar': 0.85986328125,
    'bart.large.xsum': 0.861328125},
   {'start': 46,
    'end': 53,
    'label': 0,
    'type': 'GPE',
    'ent': 'Belgium',
    'bart.large': 0.02423095703125,
    'xsum_cmlm_bos': 0.92529296875,
    'cnndm_cmlm_cedar': 0.87353515625,
    'bart.large.xsum': 0.7783203125},
   {'start': 67,
    'end': 78,
    'label': 0,
    'type': 'DATE',
    'ent': 'the last 16',
    'bart.large': 0.11419677734375,
    'xsum_cmlm_bos': 0.5908203125,
    'cnndm_cmlm_cedar': 0.482177734375,
    'bart.large.xsum': 0.324462890625},
   {'start': 86,
    'end': 94,
    'label': 2,
    'type': 'NORP',
    'ent': 'European',
    'bart.large': 0.391845703125,
    'xsum_cmlm_bos': 0.7841796875,
    'cnndm_cmlm_cedar': 0.436767578125,
    'bart.large.xsum': 0.266357421875},
   {'start': 116,
    'end': 121,
    'label': 2,
    'type': 'ORDINAL',
    'ent': 'first',
    'bart.large': 0.8125,
    'xsum_cmlm_bos': 0.9287109375,
    'cnndm_cmlm_cedar': 0.74609375,
    'bart.large.xsum': 0.630859375}]},
 'TConvS2S': {'summary': "virgil van dijk scored a hat-trick as italy came from behind to beat italy and reach the women's euro 2017 semi-finals.",
  'summary_upper': "Virgil van Dijk scored a hat-trick as Italy came from behind to beat Italy and reach the women 's euro 2017 semi-finals .",
  'ents': [{'start': 0,
    'end': 6,
    'label': 2,
    'type': 'PERSON',
    'ent': 'Virgil',
    'bart.large': 0.01129150390625,
    'xsum_cmlm_bos': 0.055419921875,
    'cnndm_cmlm_cedar': 0.0014257431030273438,
    'bart.large.xsum': 6.449222564697266e-05},
   {'start': 7,
    'end': 10,
    'label': 2,
    'type': 'PERSON',
    'ent': 'van',
    'bart.large': 0.93017578125,
    'xsum_cmlm_bos': 0.83251953125,
    'cnndm_cmlm_cedar': 0.98388671875,
    'bart.large.xsum': 0.0027408599853515625},
   {'start': 11,
    'end': 15,
    'label': 2,
    'type': 'PERSON',
    'ent': 'Dijk',
    'bart.large': 0.63037109375,
    'xsum_cmlm_bos': 0.00820159912109375,
    'cnndm_cmlm_cedar': 0.06402587890625,
    'bart.large.xsum': 0.22900390625},
   {'start': 38,
    'end': 43,
    'label': 2,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.004787445068359375,
    'xsum_cmlm_bos': 0.0006585121154785156,
    'cnndm_cmlm_cedar': 7.957220077514648e-05,
    'bart.large.xsum': 0.837890625},
   {'start': 69,
    'end': 74,
    'label': 2,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.00164031982421875,
    'xsum_cmlm_bos': 0.00022172927856445312,
    'cnndm_cmlm_cedar': 0.0002772808074951172,
    'bart.large.xsum': 0.0009450912475585938},
   {'start': 103,
    'end': 107,
    'label': 2,
    'type': 'CARDINAL',
    'ent': '2017',
    'bart.large': 0.0182952880859375,
    'xsum_cmlm_bos': 0.0304412841796875,
    'cnndm_cmlm_cedar': 0.0029964447021484375,
    'bart.large.xsum': 0.00754547119140625}]},
 'Gold': {'summary': 'emanuele giaccherini and graziano pelle scored as italy began their euro 2016 campaign with victory over much-fancied belgium in lyon.',
  'summary_upper': 'Emanuele Giaccherini and Graziano Pelle scored as Italy began their Euro 2016 campaign with victory over Much-Fancied Belgium in Lyon .',
  'ents': [{'start': 0,
    'end': 8,
    'label': -1,
    'type': 'PERSON',
    'ent': 'Emanuele',
    'bart.large': 0.00045990943908691406,
    'xsum_cmlm_bos': 7.510185241699219e-06,
    'cnndm_cmlm_cedar': 6.318092346191406e-06,
    'bart.large.xsum': 1.6927719116210938e-05},
   {'start': 9,
    'end': 20,
    'label': -1,
    'type': 'PERSON',
    'ent': 'Giaccherini',
    'bart.large': 0.84619140625,
    'xsum_cmlm_bos': 0.6962890625,
    'cnndm_cmlm_cedar': 0.0709228515625,
    'bart.large.xsum': 0.19775390625},
   {'start': 25,
    'end': 33,
    'label': -1,
    'type': 'PERSON',
    'ent': 'Graziano',
    'bart.large': 0.00013756752014160156,
    'xsum_cmlm_bos': 0.00835418701171875,
    'cnndm_cmlm_cedar': 5.960464477539062e-07,
    'bart.large.xsum': 0.0022430419921875},
   {'start': 34,
    'end': 39,
    'label': -1,
    'type': 'PERSON',
    'ent': 'Pelle',
    'bart.large': 0.86328125,
    'xsum_cmlm_bos': 0.87255859375,
    'cnndm_cmlm_cedar': 0.9013671875,
    'bart.large.xsum': 0.83935546875},
   {'start': 50,
    'end': 55,
    'label': -1,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.38671875,
    'xsum_cmlm_bos': 0.9169921875,
    'cnndm_cmlm_cedar': 0.880859375,
    'bart.large.xsum': 0.87353515625},
   {'start': 68,
    'end': 77,
    'label': -1,
    'type': 'LAW',
    'ent': 'Euro 2016',
    'bart.large': 0.023040771484375,
    'xsum_cmlm_bos': 0.72021484375,
    'cnndm_cmlm_cedar': 0.001476287841796875,
    'bart.large.xsum': 0.55908203125},
   {'start': 105,
    'end': 125,
    'label': -1,
    'type': 'ORG',
    'ent': 'Much-Fancied Belgium',
    'bart.large': 0.0,
    'xsum_cmlm_bos': 0.0,
    'cnndm_cmlm_cedar': 0.0,
    'bart.large.xsum': 0.0},
   {'start': 129,
    'end': 133,
    'label': -1,
    'type': 'GPE',
    'ent': 'Lyon',
    'bart.large': 0.004119873046875,
    'xsum_cmlm_bos': 0.05743408203125,
    'cnndm_cmlm_cedar': 0.0015192031860351562,
    'bart.large.xsum': 0.0235137939453125}]},
 'PtGen': {'summary': 'italy scored two late goals to beat italy in the first leg of their copa del rey victory over belgium.',
  'summary_upper': 'Italy scored two late goals to beat Italy in the first leg of their Copa del Rey victory over Belgium .',
  'ents': [{'start': 0,
    'end': 5,
    'label': 2,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.0019245147705078125,
    'xsum_cmlm_bos': 0.04461669921875,
    'cnndm_cmlm_cedar': 0.00035452842712402344,
    'bart.large.xsum': 0.54443359375},
   {'start': 13,
    'end': 16,
    'label': 0,
    'type': 'CARDINAL',
    'ent': 'two',
    'bart.large': 0.25537109375,
    'xsum_cmlm_bos': 0.94189453125,
    'cnndm_cmlm_cedar': 0.685546875,
    'bart.large.xsum': 0.3486328125},
   {'start': 36,
    'end': 41,
    'label': 2,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.00848388671875,
    'xsum_cmlm_bos': 0.0014486312866210938,
    'cnndm_cmlm_cedar': 0.00023317337036132812,
    'bart.large.xsum': 0.0010547637939453125},
   {'start': 49,
    'end': 54,
    'label': 2,
    'type': 'ORDINAL',
    'ent': 'first',
    'bart.large': 0.1075439453125,
    'xsum_cmlm_bos': 0.67333984375,
    'cnndm_cmlm_cedar': 0.331787109375,
    'bart.large.xsum': 0.03955078125},
   {'start': 68,
    'end': 80,
    'label': 2,
    'type': 'ORG',
    'ent': 'Copa del Rey',
    'bart.large': 0.00020456314086914062,
    'xsum_cmlm_bos': 3.325939178466797e-05,
    'cnndm_cmlm_cedar': 0.0,
    'bart.large.xsum': 0.00015163421630859375},
   {'start': 94,
    'end': 101,
    'label': 0,
    'type': 'GPE',
    'ent': 'Belgium',
    'bart.large': 0.00859832763671875,
    'xsum_cmlm_bos': 0.91796875,
    'cnndm_cmlm_cedar': 0.8125,
    'bart.large.xsum': 0.84130859375}]},
 'TranS2S': {'summary': 'romelu lukaku scored twice as italy beat italy for the second time in three years to go top of the premier league.',
  'summary_upper': 'Romelu Lukaku scored twice as Italy beat Italy for the second time in three years to go top of the Premier League .',
  'ents': [{'start': 30,
    'end': 35,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 7.110834121704102e-05,
    'xsum_cmlm_bos': 0.0005602836608886719,
    'cnndm_cmlm_cedar': 9.292364120483398e-05,
    'bart.large.xsum': 0.70751953125},
   {'start': 41,
    'end': 46,
    'label': 0,
    'type': 'GPE',
    'ent': 'Italy',
    'bart.large': 0.0196685791015625,
    'xsum_cmlm_bos': 0.0005145072937011719,
    'cnndm_cmlm_cedar': 0.0004673004150390625,
    'bart.large.xsum': 0.0007557868957519531},
   {'start': 55,
    'end': 61,
    'label': 2,
    'type': 'ORDINAL',
    'ent': 'second',
    'bart.large': 0.25927734375,
    'xsum_cmlm_bos': 0.32080078125,
    'cnndm_cmlm_cedar': 0.40673828125,
    'bart.large.xsum': 0.2548828125},
   {'start': 70,
    'end': 81,
    'label': 2,
    'type': 'DATE',
    'ent': 'three years',
    'bart.large': 0.0287322998046875,
    'xsum_cmlm_bos': 0.01520538330078125,
    'cnndm_cmlm_cedar': 0.045318603515625,
    'bart.large.xsum': 0.05419921875},
   {'start': 95,
    'end': 113,
    'label': 2,
    'type': 'ORG',
    'ent': 'the Premier League',
    'bart.large': 0.001789093017578125,
    'xsum_cmlm_bos': 8.64267349243164e-06,
    'cnndm_cmlm_cedar': 2.086162567138672e-06,
    'bart.large.xsum': 5.364418029785156e-07}]}}