In [9]:
import nltk
from nltk.tokenize import word_tokenize
from nltk.tag import pos_tag
import json
from nltk.chunk import conlltags2tree, tree2conlltags
from pprint import pprint
import random
import string
import re

In [10]:
def clean(text):
    emoji_pattern = re.compile("["
        u"\U0001F600-\U0001F64F"  # emoticons
        u"\U0001F300-\U0001F5FF"  # symbols & pictographs
        u"\U0001F680-\U0001F6FF"  # transport & map symbols
        u"\U0001F1E0-\U0001F1FF"  # flags (iOS)
                           "]+", flags=re.UNICODE)
    
    
    text = re.sub(r"https.*\s*", '', text)
    text = emoji_pattern.sub(r'', text)
    text = re.sub(r"RT @.*:", '', text)
    text = re.sub(r"@.* ", '', text)

    text = text.translate(text.maketrans('','',string.punctuation))
    text = text.replace('\n',' ')
    text = text.lower()
    return text
    
def preprocess(sent):
    sent = nltk.word_tokenize(sent)
    sent = nltk.pos_tag(sent)
    return sent


In [11]:
import spacy
from spacy import displacy
from collections import Counter
# import en_core_web_sm
# people”, “business”, “person”, and “location”. 
# Place-Place, Person-Place, Language-Place,
# Person, GPE, LOC, ORG, 
def ner(text):
    nlp = spacy.load("en_core_web_sm")
    doc = nlp(text)
    entities = [X.text for X in doc.ents if X.label_ in ['PERSON', 'GPE', 'LOC', 'ORG']]
        
    
    return entities




In [15]:
# Loading data

data = json.load(open("data.json"))

random.shuffle(data)


ans = set()
fw = open("predict.json", 'w', encoding='utf-8')


for item in data:
    try:
        text = item["text"]
        text = clean(text)
    #     print(text)
        entities = list(set(ner(text)))

        for i in range (len(entities)):
            if " " in entities[i]:
                new = entities[i].replace(" ", "_")
                text = text.replace(entities[i], new)
                entities[i] = new


        pairs = [(a, b) for idx, a in enumerate(entities) for b in entities[idx + 1:] if len(entities) >= 2]

        for pair in pairs: 
            if text.index(pair[0]) < text.index(pair[1]):

                instance = dict(
                        head=pair[0],
                        tail=pair[1],
                        sentence=text,
                    )

                print(instance)
                json.dump(instance, fw, ensure_ascii=False)
                fw.write('\n')
    except Exception as e:
        print("Error occured")

fw.close()


{'head': 'italy', 'tail': 'germany', 'sentence': 'italy faring better than germany in 4th covid19 wave '}
{'head': 'florida', 'tail': 'california', 'sentence': ' based on population size the death rate per capita in florida over the last four months was 4x greater than california’…'}
{'head': 'china', 'tail': 'syria', 'sentence': ' china has donated 500000 doses of covid19 vaccines to wartorn syria which has one of the worlds lowest inoculation rates and…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head'

{'head': 'france', 'tail': 'uk_un_usa', 'sentence': ' brbreaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austri…'}
{'head': 'france', 'tail': 'paris', 'sentence': ' brbreaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austri…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'lincoln', 'tail': 'us', 'sentence': ' three snow leopards at the lincoln childrens zoo in the us state of nebraska have died of

{'head': 'kerala', 'tail': 'india_kerala', 'sentence': 'govt  31923 covid19 cases detected on wednesday kerala reported 19675 cases with  301 lakh active cases in india_kerala has over 161 lakh active cases  of 282 deaths reported  142 from kerala__'}
{'head': 'kerala', 'tail': 'kerala__', 'sentence': 'govt  31923 covid19 cases detected on wednesday kerala reported 19675 cases with  301 lakh active cases in india_kerala has over 161 lakh active cases  of 282 deaths reported  142 from kerala__'}
{'head': 'india_kerala', 'tail': 'kerala__', 'sentence': 'govt  31923 covid19 cases detected on wednesday kerala reported 19675 cases with  301 lakh active cases in india_kerala has over 161 lakh active cases  of 282 deaths reported  142 from kerala__'}
{'head': 'nbc_abc_cbs', 'tail': 'cnn', 'sentence': ' clips from nbc_abc_cbs and cnn show pfizer one of the main manufacturers of the covid19 injection is funding many s…'}
{'head': 'khalid_bin', 'tail': 'jose', 'sentence': 'the general manager of

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'murali_vijay', 'tail': 'covid19', 'sentence': ' murali_vijay has made himself unavailable for tamil nadu selections as hes hesitant to take the covid19 vaccine vijay…'}
{'head': 'china', 'tail': 'tha', 'sentence': ' china on friday donated 128 million yuan 2 millionworth covid19 nucleic acid test kits and sample releaser buffers tha…'}
{'head': 'arkansas', 'tail': 'florida', 'sentence': ' alabama arkansas florida georgia louisiana…'}
{'head': 'arkansas', 'tail': 'georgia', 'sentence': ' alabama arkansas florida georgia louisiana…'}
{'head': 'arkansas', 'tail': 'louisiana', 'sentence': ' alabama arkansas florida georgia louisiana…'

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'richard', 'tail': 'richard_urso_d', 'sentence': ' covid19 watch covid summit in kansas city  speakers inclu

{'head': 'china', 'tail': 'grou', 'sentence': ' more than 8439 million children aged 3 to 11 in china have received covid19 vaccines 4944 million children of the age grou…'}
{'head': 'florida', 'tail': 'california', 'sentence': ' based on population size the death rate per capita in florida over the last four months was 4x greater than california’…'}
{'head': 'orlando', 'tail': 'florida', 'sentence': 'expert house cleaning service  cleaning clean cleaningservice housecleaning homecleaning residentialcleaning cleanhouse bathroom kitchen moving realestate money today family love orlando florida millenia covid19 '}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'europe_eu', 'tail'

{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'national_guard_general', 'tail': 'pentagon', 'sentence': 'national_guard_general defies pentagon’s covid19 vaccine mandate for soldiers — rt usa news '}
{'head': 'florida', 'tail': 'individual_freedo', 'sentence': ' california and florida both see the same amount of excess deaths since pandemic start  florida respects individual_freedo…'}
{'head': 'california', 'tail': 'individual_freedo', 'sentence': ' california and florida both see the same amount of e

{'head': 'ghana', 'tail': 'africa', 'sentence': 'kusi ideas festival organized by nation media group is back and will be held in accra ghana on 10th amp 11th december 2021 this year’s conference comes nearly two years into the covid19 pandemic that has upended the world and africa in ways nothing else has   kusifest2021 '}
{'head': 'kusi', 'tail': 'africa', 'sentence': 'kusi ideas festival organized by nation media group is back and will be held in accra ghana on 10th amp 11th december 2021 this year’s conference comes nearly two years into the covid19 pandemic that has upended the world and africa in ways nothing else has   kusifest2021 '}
{'head': 's', 'tail': 'hainan', 'sentence': ' worlds 1st aerosolized inhaled covid19 vaccine made debut at a health expo in s chinas hainan developed by chinas_cans…'}
{'head': 's', 'tail': 'chinas_cans', 'sentence': ' worlds 1st aerosolized inhaled covid19 vaccine made debut at a health expo in s chinas hainan developed by chinas_cans…'}
{'head': '

{'head': 'iowa', 'tail': 'gop', 'sentence': 'control_iowa counties wworst covid19 vaccination rates are heavily republican the iowa gop candidates ago'}
{'head': 'the_health_department', 'tail': 'south_africa', 'sentence': 'the_health_department has launched the vax champs campaign and has invited everyone living in south_africa to become an ambassador for vaccination against covid19 dr fundile nyati elaborates on the campaign  watch newzroom405 '}
{'head': 'china', 'tail': 'eu', 'sentence': 'titfortat subsidy dynamics  within six months of china introducing a subsidy in a product line 58 of the time the eu awarded a subsidy in the same line of business   read more here covid19 '}
{'head': 'titfortat', 'tail': 'eu', 'sentence': 'titfortat subsidy dynamics  within six months of china introducing a subsidy in a product line 58 of the time the eu awarded a subsidy in the same line of business   read more here covid19 '}
{'head': 'europe', 'tail': 'measur', 'sentence': ' the patterns that 

{'head': 'china', 'tail': 'syria', 'sentence': ' china has donated 500000 doses of covid19 vaccines to wartorn syria which has one of the worlds lowest inoculation rates and…'}
{'head': 'boris_johnson', 'tail': 'knell_britain_brexit_borishasfailedbritain_borisjohnson', 'sentence': 'boris_johnson britains death knell_britain_brexit_borishasfailedbritain_borisjohnson '}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'europe', 'tail': 'uk', 'sentence': ' boris_johnson suggested he is worried a wave of cov

{'head': 'china', 'tail': 'moscow', 'sentence': 'thats because the chinese version quickly changed from wet market to developed on a military base in america and us soldiers brought it to china most russians believe that version by the way according to my moscow source covid19 china '}
{'head': 'america', 'tail': 'moscow', 'sentence': 'thats because the chinese version quickly changed from wet market to developed on a military base in america and us soldiers brought it to china most russians believe that version by the way according to my moscow source covid19 china '}
{'head': 'china', 'tail': 'syria', 'sentence': ' china has donated 500000 doses of covid19 vaccines to wartorn syria which has one of the worlds lowest inoculation rates and…'}
{'head': 'new_york', 'tail': 'rodrick_wallace', 'sentence': 'coming soon the recurrence of covid19 in new_york state and new_york city surfing the second wave by deborah_wallace and rodrick_wallace '}
Error occured
{'head': 'yok', 'tail': 'kanchan

{'head': 'australia', 'tail': 'ghana', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana deltavariant arizona israel murder children mamabear notaboutavirus '}
{'head': 'australia', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana deltavariant arizona israel murder children mamabear notaboutavirus '}
{'head': 'australia', 'tail': 'india', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana deltavariant arizona israel murder children mamabear notaboutavirus '}
{'head': 'ghana', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins austr

{'head': 'australia', 'tail': 'ghana', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana deltavariant arizona israel murder children mamabear notaboutavirus  china quarantine camps truck '}
{'head': 'australia', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana deltavariant arizona israel murder children mamabear notaboutavirus  china quarantine camps truck '}
{'head': 'australia', 'tail': 'india', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana deltavariant arizona israel murder children mamabear notaboutavirus  china quarantine camps truck '}
{'head': 'ghana', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a albert

{'head': 'kerala', 'tail': 'lalitha_kala_academy', 'sentence': ' it is absolutely disgusting that idiotic jurors of kerala lalitha_kala_academy have ridiculed the hard work and sacrifices…'}
{'head': 'italy', 'tail': 'france', 'sentence': ' and in italy and france you got surges of vaccination with the introduction of vaccination measures  but introducing new v…'}
{'head': 'national_guard_general', 'tail': 'pentagon', 'sentence': 'national_guard_general defies pentagon’s covid19 vaccine mandate for soldiers — rt usa news '}
{'head': 'china', 'tail': 'grou', 'sentence': ' more than 8439 million children aged 3 to 11 in china have received covid19 vaccines 4944 million children of the age grou…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morni

{'head': 'kamloops_british_columbia', 'tail': 'canada', 'sentence': 'icymi a fourth unit has an outbreak of covid19 at royal inland hospital in kamloops_british_columbia via ⬇️  bcpoli canada covid19bc healthcare '}
{'head': 'wellington_parliament', 'tail': 'new_zealand', 'sentence': ' new  protest against covid19 measures and restrictions outside wellington_parliament in new_zealand  '}
{'head': 'the_caribbean_jamaica', 'tail': 'cuba', 'sentence': 'covid19 dashboard for the_caribbean_jamaica edition haití cuba dominicanrepublic coronavirusrd coronavirus rd '}
{'head': 'china', 'tail': 'biden_usa_texas', 'sentence': 'yes america  sue the fuck out of every company in america   they can get their money back from china and fauci  cryptocurrency elon dogelonmars nfl binance biden_usa_texas covid19'}
{'head': 'china', 'tail': 'nfl', 'sentence': 'yes america  sue the fuck out of every company in america   they can get their money back from china and fauci  cryptocurrency elon dogelonmars nfl

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'india', 'tail': 'uk', 'sentence': '   who approved emergency use of bharat biotechs covaxin   111 crore vaccinations done so far in india  96 countries including us uk many european and\xa0middle east \xa0nations  have agreed to  recognize covid19 vaccination certificates issued in india  covid19'}
{'head': 'australia', 'tail': 'uk_nato', 'sentence': ' america not a christian country anymore eu_canada australia uk_nato atta…'}
{'head': 'eu_canada', 'tail': 'uk_nato', 'sentence': ' america not a christian country anymore eu_canada australia uk_nato atta…'}
{'head': 'maría_caridad_rivera', 'tail': 'st_catherine', 'sentence': ' profe

{'head': 'iqbal', 'tail': 'siemens', 'sentence': ' another addition to one of our hundreds of certified of 2021                     congratulations   to mr asim iqbal from siemens to pass the pmp exam  with all above target projectmanagement pmp pmi pmpcertified pmptraining covid19 '}
{'head': 'florida', 'tail': 'california', 'sentence': ' based on population size the death rate per capita in florida over the last four months was 4x greater than california’…'}
{'head': 'china', 'tail': 'grou', 'sentence': ' more than 8439 million children aged 3 to 11 in china have received covid19 vaccines 4944 million children of the age grou…'}
{'head': 'mtosterholm_covidcanada', 'tail': 'govtomwolf', 'sentence': 'covid19 mtosterholm_covidcanada nytimes govtomwolf  leader in contagion in the north  ohio rt 202 more than 3200 new suspected cases and 361 deaths reported today last two days on the top of this '}
{'head': 'china', 'tail': 'tha', 'sentence': ' china on friday donated 128 million yuan 2 m

{'head': 'florida', 'tail': 'individual_freedo', 'sentence': ' california and florida both see the same amount of excess deaths since pandemic start  florida respects individual_freedo…'}
{'head': 'california', 'tail': 'individual_freedo', 'sentence': ' california and florida both see the same amount of excess deaths since pandemic start  florida respects individual_freedo…'}
{'head': 'scotland', 'tail': 'north_west__', 'sentence': 'english regions scotland wales ni amp roi covid19 cases per 100000 residents reported in the last 7 days  west midlands moves above north_west__east of england moves above north_east__england increases from 359 cases per 100k thursday to 372 per 100k friday '}
{'head': 'scotland', 'tail': 'north_east__england', 'sentence': 'english regions scotland wales ni amp roi covid19 cases per 100000 residents reported in the last 7 days  west midlands moves above north_west__east of england moves above north_east__england increases from 359 cases per 100k thursday to

{'head': 'cuba', 'tail': 'guyana_surinam', 'sentence': 'covid19 dashboard for the caribbean haití  dominicanrepublic coronavirusrd cases per million correlations pie plot investigating significant correlations among jamaica amp cuba surinam amp cuba stkitts amp guyana_surinam amp guyana trinidad amp guyana_r_gt 05 '}
{'head': 'jamaica', 'tail': 'guyana_surinam', 'sentence': 'covid19 dashboard for the caribbean haití  dominicanrepublic coronavirusrd cases per million correlations pie plot investigating significant correlations among jamaica amp cuba surinam amp cuba stkitts amp guyana_surinam amp guyana trinidad amp guyana_r_gt 05 '}
{'head': 'thomas_mancinos', 'tail': 'covid19', 'sentence': ' pentagon responds to new adjutant general thomas_mancinos move to rescind the covid19 vaccine mandate for…'}
{'head': 'dublin', 'tail': 'georgia', 'sentence': ' michael lancaster 66yo nurse practitioner dublin georgia died of covid19 61021 after a 6 week fight he was an avid out…'}
{'head': '▒', '

{'head': 'brazil', 'tail': 'yeg_yyc', 'sentence': 'go brazil howdareyou  caseademic serveandprotect against treason plandemic nuremberg2  crimesagainsthumanity  coercivecontrol  supportlocal covid19 covid19on covid19mb covid19sk covid19ab covid19bc ableg abpoli cndpoli yeg_yyc '}
{'head': 'brazil', 'tail': 'covid19ab', 'sentence': 'go brazil howdareyou  caseademic serveandprotect against treason plandemic nuremberg2  crimesagainsthumanity  coercivecontrol  supportlocal covid19 covid19on covid19mb covid19sk covid19ab covid19bc ableg abpoli cndpoli yeg_yyc '}
{'head': 'liza_l_mangubat', 'tail': 'canada', 'sentence': 'liza_l_mangubat calapandayan subic zambales philippines 2209 im support the covid19 social distancing fismash fished wash your hands stay at home to continue to developing technology i want to help to travel us canada to all country all around the world  '}
{'head': 'anc', 'tail': 'ramaphosa_dlaminizuma', 'sentence': 'interesting thoughts and read  will mogoeng become the co

{'head': 'india', 'tail': 'israel', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta ontario toronto covid19 corruption wake science sciencewins australia india arizona israel murder children notaboutavirus  pharmacy tried to do a workaround when child doses unavailable  '}
{'head': 'india', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta ontario toronto covid19 corruption wake science sciencewins australia india arizona israel murder children notaboutavirus  pharmacy tried to do a workaround when child doses unavailable  '}
{'head': 'australia', 'tail': 'israel', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta ontario toronto covid19 corruption wake science sciencewins australia india arizona israel murder children notaboutavirus  pharmacy tried to do a workaround when child doses unavailable  '}
{'head': 'australia', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta ontario toronto covid19 corruption wake science 

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'florida', 'tail': 'individual_freedo', 'sentence': ' california and florida both see the same amount of excess deaths since pandemic start  florida respects individual_freedo…'}
{'head': 'california', 'tail': 'individual_freedo', 'sentence': ' california and florida both see the same amount of excess deaths since pandemic start  florida respects individual_freedo…'}
{'head': 'gauteng', 'tail': 'eastern', 'sentence': 'jeez and there i thought we in gauteng were naturally streets ahead of limpopo and eastern cape covid19 vaccines '}
{'head': 'kuwait', 'tail': 'arab_arabia', 'sentence': 'kuwait against covid tyranny freedom  covidvac

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'wellington_parliament', 'tail': 'new_zealand', 'sentence': ' new  protest against covid19 measures and restrictions outside wellington_parliament in new_zealand  '}
{'head': 'australia', 'tail': 'ghana', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india ghana arizona israel murder children notaboutavirus  must see please share ❤ '}
{'head': 'australia', 'tail': 'arizona', 'sentence': 'blacklivesmatter nickiminaj maga 2a alberta_ontario_toronto health covid19 covid19 cancer corruption wakey science sciencewins australia india g

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'nba_nfl', 'tail': 'mlb', 'sentence': ' nba_nfl mlb nhl_mls nascar uefa uci_esports_business_ai treasure covid19 gf2640 the big picture of the dig…'}
{'head': 'nba_nfl', 'tail': 'nhl_mls', 'sentence': ' nba_nfl mlb nhl_mls nascar uefa uci_esports_business_ai treasure covid19 gf2640 the 

{'head': 'charlie_mitchell', 'tail': 'katie_kenny', 'sentence': ' simon thornley is a fraud he promotes lies his credibility is zero  charlie_mitchell amp katie_kenny rip thornley a new o…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthc

{'head': 'wellington_parliament', 'tail': 'new_zealand', 'sentence': ' new  protest against covid19 measures and restrictions outside wellington_parliament in new_zealand  '}
{'head': 'uk', 'tail': 'pediat', 'sentence': ' 99995 children survive covid19  uk data shows a 12 month study from 4 uk universities nhs amp specialists in pediat…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'thomas_mancinos', 'tail': 'covid19', 'sentence': ' pentagon responds to new adjutant general thomas_mancinos move to rescind the covid19 vaccine mandate for…'}
{'head': 'robert_f_kennedy_jr_speaking', 'tail': 'berlin', 'sentence': ' 89 robert_f_kennedy_jr_speaking truth in berlin  ichbineinberlin

{'head': 'china', 'tail': 'tha', 'sentence': ' china on friday donated 128 million yuan 2 millionworth covid19 nucleic acid test kits and sample releaser buffers tha…'}
{'head': 'india', 'tail': 'biggboss15', 'sentence': 'india administered 112 crore covid19 vaccines  gfvip btc biggboss15 prelemi giveaways  quote ada heeseung qnt bb15 yargi indiancricketteam '}
{'head': 'florida', 'tail': 'california', 'sentence': ' based on population size the death rate per capita in florida over the last four months was 4x greater than california’…'}
{'head': 'f1_japan', 'tail': 'london', 'sentence': 'read the quran   jesus muslim islam quote f1_japan twitter covid19 london italia formel1 lapalma '}
{'head': 'islam', 'tail': 'london', 'sentence': 'read the quran   jesus muslim islam quote f1_japan twitter covid19 london italia formel1 lapalma '}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kancha

{'head': 'switzerland', 'tail': 'estonia', 'sentence': 'switzerland vs estonia up to 20211114  switzerland     total cases 317017     total deaths 4236  estonia     total cases 11698     total deaths 109  switzerland estonia covid19 coronavirus '}
{'head': 'europe', 'tail': 'india', 'sentence': 'coronavirus news live updates is waning immunity of astrazeneca vaccine behind covid resurgence in europe coronavirus news live updates the eus diseases agency said 10 countries in the 27member bloc faced a covid s india by news18 '}
{'head': 'china', 'tail': 'tha', 'sentence': ' china on friday donated 128 million yuan 2 millionworth covid19 nucleic acid test kits and sample releaser buffers tha…'}
{'head': 'moderna_covid19_vaccine', 'tail': 'uganda', 'sentence': ' great news as 19m moderna_covid19_vaccine doses donated by the canadian government arrived in uganda yesturday the donatio…'}
{'head': 'wellington_parliament', 'tail': 'new_zealand', 'sentence': ' new  protest against covid19 measur

{'head': 'national_guard_general', 'tail': 'pentagon', 'sentence': 'national_guard_general defies pentagon’s covid19 vaccine mandate for soldiers  hold the line '}
{'head': 'charlie_mitchell', 'tail': 'katie_kenny', 'sentence': ' simon thornley is a fraud he promotes lies his credibility is zero  charlie_mitchell amp katie_kenny rip thornley a new o…'}
{'head': 'china', 'tail': 'hong_kong', 'sentence': '1 new case in china hong_kong sar   1010 gmt coronavirus coronavirusupdate covid19 coronaviruspandemic'}
{'head': 'florida', 'tail': 'california', 'sentence': ' based on population size the death rate per capita in florida over the last four months was 4x greater than california’…'}
{'head': 'ali_mokdad', 'tail': 'the_university_of_washington', 'sentence': '“delta and waning immunity — the combination of these two have set us back” said ali_mokdad a professor of health metrics sciences at the_university_of_washington “this virus is going to stick with us for a long long time” pandemic c

{'head': 'india', 'tail': 'se_ladega', 'sentence': ' ‘mask pehnega india corona se_ladega india’  we all have to be responsible in our fight against covid19 and take all the…'}
{'head': 'liam_jones', 'tail': 'carlton_blues_retires', 'sentence': 'afl player liam_jones of carlton_blues_retires after covid19 vaccine saga afl covid19 vaccination policy '}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'georgia', 'tail': 'california', 'sentence': ' imagine saying the covid19 deaths in georgia are not comparable to those of california due to higher  of african americans…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early 

{'head': 'max', 'tail': '🤣', 'sentence': 'this is fascinating though i admit to understanding only 20 of it max  you just know the idiots are going to get stuck on “nanoparticles” and “luciferase” though 🤣  covid19 '}
{'head': 'kazakhstan', 'tail': 'iran', 'sentence': ' virus  you can get one in china india russia kazakhstan iran…'}
{'head': 'china', 'tail': 'india', 'sentence': ' virus  you can get one in china india russia kazakhstan iran…'}
{'head': 'china', 'tail': 'russia', 'sentence': ' virus  you can get one in china india russia kazakhstan iran…'}
{'head': 'india', 'tail': 'russia', 'sentence': ' virus  you can get one in china india russia kazakhstan iran…'}
{'head': 'irancovid19', 'tail': 'victimsgt475300', 'sentence': 'irancovid19 victimsgt475300  '}
{'head': 'california', 'tail': 'colorado', 'sentence': ' officials in california colorado and newmexico are expanding access to boostershots against covid19 as they grapple…'}
{'head': 'europe', 'tail': 'spain', 'sentence': ' do

{'head': 'marriott', 'tail': 'sha_tin', 'sentence': 'labour and welfare chief law chikwong says the courtyard by marriott in sha_tin will next month become a covid19 quarantine hotel for foreign domestic helpers arriving in hongkong '}
{'head': 'india', 'tail': 'kerala', 'sentence': ' last 24 hours india reports 11271 covid19 new cases out of which 6468 are from kerala'}
{'head': 'kerala', 'tail': 'lalitha_kala_academy', 'sentence': ' it is absolutely disgusting that idiotic jurors of kerala lalitha_kala_academy have ridiculed the hard work and sacrifices…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'india', 'tail': 'the_ministry_of_health', 'sentence': 'coronavirusindiaup

{'head': 'orlando', 'tail': 'florida', 'sentence': 'reliable cleaning amp maid service  cleaning clean cleaningservice housecleaning homecleaning residentialcleaning cleanhouse bathroom kitchen moving realestate money today family love orlando florida millenia covid19 '}
{'head': 'china', 'tail': 'grou', 'sentence': ' more than 8439 million children aged 3 to 11 in china have received covid19 vaccines 4944 million children of the age grou…'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'china', 'tail': 'wuhan', 'sentence': ' three detained over packed esports celebration in china’s wuhan  '}
{'head': 'california', 'tail': 'colorado', 'sentence': ' officials in california colo

{'head': 'california', 'tail': 'colorado', 'sentence': ' officials in california colorado and newmexico are expanding access to boostershots against covid19 as they grapple…'}
{'head': 'robert37959944', 'tail': 'usa', 'sentence': ' thank you robert37959944 i was writing amp recording in usa when this was informally announced but dismissed as …'}
{'head': 'brazil', 'tail': 'jair_bolsonaro', 'sentence': 'covid19 brazil president jair_bolsonaro confronted who head tedros adhanom on covid19 restrictions and ask why people are still dying after the second dose and asserted that all over the world there are people who need to work to feed themselves '}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi fro

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'auspol', 'tail': 'uk', 'sentence': 'auspol   uk parliament   '}
{'head': 'malaysia', 'tail': 'cases2541147', 'sentence': 'coronavirus latest updates  malaysia  daily cases  14 nov 2021  5809 new cases 55 new deaths source total cases2541147  recovered2446197  deaths29631  source coronavirus covid19 coronavirusupdates'}
{'head': 'china', 'tail': 'pr', 'sentence': ' china provided another batch of covid19 vaccines ampantipandemic supplies to thailand on friday thai prime minister pr…'}
{'head': 'china', 'tail': 'thailand', 'sentence': ' china provided another batch of covid19 vaccines ampantipandemic supplies to thailand on friday t

{'head': 'france', 'tail': 'uk_un_usa', 'sentence': ' breaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austria_austra…'}
{'head': 'france', 'tail': 'austria_austra', 'sentence': ' breaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austria_austra…'}
{'head': 'france', 'tail': 'paris', 'sentence': ' breaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austria_austra…'}
{'head': 'uk_un_usa', 'tail': 'austria_austra', 'sentence': ' breaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austria_austra…'}
{'head': 'queensland', 'tail': 'abc_news__', 'sentence': 'queensland hits 70pc double covid vaccination milestone  abc_news__'}
{'head': 'america', 'tail': 'iran', 'sentence': 'embarrassing stealing muslims oil while america and nato is stealing oil gold and denying food and medicine covid19 va

{'head': 'china', 'tail': 'grou', 'sentence': ' more than 8439 million children aged 3 to 11 in china have received covid19 vaccines 4944 million children of the age grou…'}
{'head': 'china', 'tail': 'grou', 'sentence': ' more than 8439 million children aged 3 to 11 in china have received covid19 vaccines 4944 million children of the age grou…'}
{'head': 'victoria_doh', 'tail': 'covid19vicdata_covid19vic_covid19aus', 'sentence': 'victoria_doh daily covid19 stats now show icu cleared cases  people who are cleared of infection but still in intensive care due to massive damage to their heartlungsetc covid19vicdata_covid19vic_covid19aus '}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'kazakhstan', 'tail': 'iran', 'sentence': 'virus  you can get one in china india russia kazakhstan iran  fancy your chances  covid19 vaccinessavelives'}
{'head': 'china', 'tail': 'india', 'sentence': 'virus  you can get one in china india russia kazakhstan iran  fancy your chances  covid19 vaccinessavelives'}
{'head': 'china', 'tail': 'russia', 'sentence': 'virus  you can get one in china india russia kazakhstan iran  fancy your chances  covid19 vaccinessavelives'}
{'head': 'india', 'tail': 'russia', 'sentence': 'virus  you can get one in china india russia kazakhstan iran  fancy your chances  covid19 vaccinessavelives'}
{'head': '

{'head': 'wellington_parliament', 'tail': 'new_zealand', 'sentence': ' new  protest against covid19 measures and restrictions outside wellington_parliament in new_zealand  '}
{'head': 'america_eu_canada', 'tail': 'australia', 'sentence': 'sweden suspends moderna shot indefinitely after vaxxed patients develop crippling heart condition while america_eu_canada australia uk_nato_force unproven dangerous vaccine covid19 '}
{'head': 'america_eu_canada', 'tail': 'uk_nato_force', 'sentence': 'sweden suspends moderna shot indefinitely after vaxxed patients develop crippling heart condition while america_eu_canada australia uk_nato_force unproven dangerous vaccine covid19 '}
{'head': 'australia', 'tail': 'uk_nato_force', 'sentence': 'sweden suspends moderna shot indefinitely after vaxxed patients develop crippling heart condition while america_eu_canada australia uk_nato_force unproven dangerous vaccine covid19 '}
{'head': 'sweden', 'tail': 'uk_nato_force', 'sentence': 'sweden suspends moderna 

{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': '🧡🧡🧡', 'tail': '🧡🧡🧡__🧡', 'sentence': ' 🧡🧡🧡sunday newsletter 🧡🧡🧡__🧡 we remember mortality and morbidity  🧡 new  guidelines 🧡 lckchampion danielgri…'}
{'head': 'kerala', 'tail': 'lalitha_kala_academy', 'sentence': ' it is absolutely disgusting that idiotic jurors of kerala lalitha_kala_academy have ridiculed the hard work and sacrifices…'}
{'head': 'europe', 'tail': 'central_asia', 'sentence': ' europe and central_asia again at the epicentre of the pandem…'}
{'head': 'china', 'tail': 'pr', 'sentence': ' china provided another batch of covid19 vaccines ampantipandemic supplies to thailand on friday thai prime minister pr…'}
{'head': '

{'head': 'california', 'tail': 'san_joaquin_valley_faces', 'sentence': 'california’s san_joaquin_valley_faces eternal wave of\xa0covid '}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'india', 'tail': 'unite2fightcorona', 'sentence': 'aai and its officials are dedicated to serving the nation but without your assistance we cannot achieve a covid19 free india while travelling always follow safety guidelines amp protect yourself and others as all indians unite2fightcorona '}
{'head': 'california', 'tail'

{'head': 'toronto', 'tail': 'canada', 'sentence': 'the cure was worse than the disease death of the gym fitness industry toronto ontario canada 395 total days closed since pandemic started '}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'la_county', 'tail': 'covid_winter', 'sentence': 'la_county health director says covid_winter flare a ‘real possibility’ – cbs los\xa0angeles '}
{'head': 'pittsburgh', 'tail': 'ben', 'sentence': ' pittsburgh ap — pittsburgh quarterback ben roethlisberger has been placed on the covid19 list and will miss the steelers’ gam…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk 

{'head': 'italy', 'tail': 'france', 'sentence': 'italy france portugal introduced vaccine control measures before they relaxed other restrictions and at a time when public mobilisation over covid19 was still high this gave time for vaccine controls to become a matter of routine timing matters a lot in generating compliance'}
{'head': 'frankfurt', 'tail': 'hong_kong', 'sentence': ' cathay_pacific_pilots who passed through frankfurt ‘to be sent to hong_kong quarantine’ scores of cargo pilots affected …'}
{'head': 'cathay_pacific_pilots', 'tail': 'hong_kong', 'sentence': ' cathay_pacific_pilots who passed through frankfurt ‘to be sent to hong_kong quarantine’ scores of cargo pilots affected …'}
{'head': 'yok', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning at chai_daen sai yok district kanchanaburi from i…'}
{'head': 'chai_daen', 'tail': 'kanchanaburi', 'sentence': ' surasi force arrested 133 illegal immigrants in the early morning 

{'head': 's', 'tail': 'ms_miller', 'sentence': 'liza mangubat im support all senate vote mr beckerman ms_miller s stout mr blumenthal ms b i to support the covid19 social distancing fismash fished wash to continue to developing technology electricity carbon solar gasolines hydrogen innovation climate  '}
{'head': 'new_mexico', 'tail': 'denver', 'sentence': 'colorado joins new_mexico and california to deliver covid boosters to all adults – cbs\xa0denver '}
{'head': 'new_mexico', 'tail': 'california', 'sentence': 'colorado joins new_mexico and california to deliver covid boosters to all adults – cbs\xa0denver '}
{'head': 'france', 'tail': 'uk_un_usa', 'sentence': ' breaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austria …'}
{'head': 'france', 'tail': 'paris', 'sentence': ' breaking thousands of people protested against the vaccine pass   breakingnews france paris uk_un_usa austria …'}
{'head': 'orlando', 'tail': 'florida', 'sentence':

{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'china', 'tail': 'pakistan', 'sentence': 'china gifted 100000 novel coronavirus nucleic acid test kits and sample releaser buffers worth about 2 million to pakistan in support of the fight against the covid19 amid celebrations of bilateral ties for 70 years '}
{'head': 'guyana', 'tail': 'ali', 'sentence': 'guyana president ali promises to eliminate crime covid19 covid pandemic world caribbean vaccine vaccination 2021 guyana'}
{'head': 'national_guard_gener

{'head': 'europe', 'tail': 'uk', 'sentence': ' boris_johnson suggested he is worried a wave of covid19 infections in europe could affect the uk for avoidance of any doubt…'}
{'head': 'boris_johnson', 'tail': 'uk', 'sentence': ' boris_johnson suggested he is worried a wave of covid19 infections in europe could affect the uk for avoidance of any doubt…'}
{'head': 'healthcare_workers', 'tail': 'uk', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'healthcare_workers', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'uk', 'tail': 'covid19', 'sentence': ' a significant proportion of healthcare_workers hcws in the uk exposed to sarscov2 during the 1st wave of covid19 nev…'}
{'head': 'haitian', 'tail': 'beijing', 'sentence': ' four confirmed covid19 infections and one asymptomatic case a

In [1]:
{"head": "la_jolla", "tail": "san_diego", "sentence": "la jolla is in san diego"}