This notebook explores the data for relations between humans and locations, including:
* P19: place of birth
* P20: place of death
* P27: country of citizenship
* P937: work location


In [1]:
import pandas as pd
# Do not truncate long cell contents when rendering frames (None = unlimited width).
pd.options.display.max_colwidth = None

In [2]:
# Google Drive download links for the four relation files, one per Wikidata
# property listed in the introduction (P19 place of birth, P20 place of death,
# P27 country of citizenship, P937 work location).
P19_path = 'https://drive.google.com/uc?id=1iV55_NPswKMYCmAskdXqOKxnnRcQSsO6'
P20_path = 'https://drive.google.com/uc?id=18GC3W4SWf0iDtzY_KX5Vv9UQdgi8sCmZ'
P27_path = 'https://drive.google.com/uc?id=1FN5UWBdCuTHozfir1quXpwnOKtVdT3Ig'
P937_path = 'https://drive.google.com/uc?id=1znIwPdriMCW3opM1x8YTRmkcWEYlSUA9'
# Relative path to a local CSV; not referenced by the cells shown in this part
# of the notebook (presumably used further down -- verify).
geo_path = 'geodata.csv'

In [3]:
# Read every relation file as line-delimited JSON (one record per line),
# keeping the untouched originals under their own names.
df19_original, df20_original, df27_original, df937_original = [
  pd.read_json(source, lines = True)
  for source in (P19_path, P20_path, P27_path, P937_path)
]

In [4]:
def extract(df):
  """Return a new frame without the identifier columns.

  The columns "uuid", "obj_uri", "sub_uri" and "predicate_id" are removed;
  every other column is kept and the input frame is not modified.
  A KeyError is raised if any of the four columns is missing.
  """
  unwanted = ["uuid", "obj_uri", "sub_uri", "predicate_id"]
  return df.drop(columns = unwanted)

In [5]:
# Strip the identifier columns from each relation frame, then stack the four
# results into a single frame with a fresh consecutive index.
dataframes = list(map(
  extract,
  (df19_original, df20_original, df27_original, df937_original),
))
concat_data = pd.concat(dataframes, ignore_index = True)
concat_data

Unnamed: 0,obj_label,sub_label,evidences
0,Alexandra,Allan Peiper,"[{'sub_surface': 'Allan Peiper', 'obj_surface': 'Alexandra, Victoria', 'masked_sentence': 'Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races.'}, {'sub_surface': 'Allan Peiper', 'obj_surface': 'Alexandra, Victoria', 'masked_sentence': 'Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races.'}]"
1,Doncaster,Anthony Barber,"[{'sub_surface': 'Anthony Barber', 'obj_surface': 'Doncaster', 'masked_sentence': 'It was won by the Conservative candidate Anthony Barber, who returned after losing his [MASK] constituency in the 1964 General Election.'}]"
2,Scotland,Paul Mounsey,"[{'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scottish', 'masked_sentence': 'NahooToo is the second album by [MASK] musician Paul Mounsey.'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scottish', 'masked_sentence': 'City of Walls is the fourth album by [MASK] musician Paul Mounsey released in 2003 (see 2003 in music).'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scotland', 'masked_sentence': 'Paul Mounsey (born 15 April 1959) is a composer, arranger and producer from [MASK].'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scotland', 'masked_sentence': 'Paul Mounsey (born 15 April 1959) is a composer, arranger and producer from [MASK].'}]"
3,Toronto,Moe Koffman,"[{'sub_surface': 'Moe Koffman', 'obj_surface': 'Toronto', 'masked_sentence': 'He has performed with many of [MASK]'s foremost musicians including as a longstanding and charter member of Bernie Senensky's Moe Koffman Tribute Band.'}]"
4,Vienna,Kurt Schwertsik,"[{'sub_surface': 'Kurt Schwertsik', 'obj_surface': 'Vienna', 'masked_sentence': 'Kurt Schwertsik (born 25 June 1935, [MASK]) is an Austrian contemporary composer.'}, {'sub_surface': 'Kurt Schwertsik', 'obj_surface': 'Vienna', 'masked_sentence': 'Kurt Schwertsik (born 25 June 1935, [MASK]) is an Austrian contemporary composer.'}]"
...,...,...,...
3812,Gloucester,Arthur Headlam,"[{'sub_surface': 'Arthur Cayley Headlam', 'obj_surface': 'Gloucester', 'masked_sentence': 'Arthur Cayley Headlam CH (2 August 1862 – 17 January 1947) was an English theologian who served as Bishop of [MASK] from 1923 to 1945.'}, {'sub_surface': 'Arthur Cayley Headlam', 'obj_surface': 'Gloucester', 'masked_sentence': 'Arthur Cayley Headlam CH (2 August 1862 – 17 January 1947) was an English theologian who served as Bishop of [MASK] from 1923 to 1945.'}]"
3813,Vienna,Salomon Stricker,"[{'sub_surface': 'Salomon Stricker', 'obj_surface': 'Viennese', 'masked_sentence': 'In 1871 he visited England to help in the translation of a German work Handbuch der Lehre von den Geweben des Menchen und des There by his [MASK] teachers Salomon Stricker (1834-1898).'}]"
3814,Berlin,Carl Joseph Begas,"[{'sub_surface': 'Carl Joseph Begas', 'obj_surface': 'Berlin', 'masked_sentence': 'His first master was Seig in Magdeburg, and in 1828 he entered the studio of Carl Joseph Begas in [MASK], and went in 1831 to Düsseldorf, to the atelier of Friedrich Wilhelm Schadow, with whom he remained six years.'}]"
3815,Munich,Eugen Roth,"[{'sub_surface': 'Eugen Roth', 'obj_surface': 'Munich', 'masked_sentence': 'Eugen Roth (January 24, 1895 in [MASK] – April 28, 1976 in Munich) was a German lyricist and poet who wrote mostly humorous verse.'}, {'sub_surface': 'Eugen Roth', 'obj_surface': 'Munich', 'masked_sentence': 'Eugen Roth (January 24, 1895 in Munich – April 28, 1976 in [MASK]) was a German lyricist and poet who wrote mostly humorous verse.'}, {'sub_surface': 'Eugen Roth', 'obj_surface': 'Munich', 'masked_sentence': 'Eugen Roth (January 24, 1895 in [MASK] – April 28, 1976 in Munich) was a German lyricist and poet who wrote mostly humorous verse.'}, {'sub_surface': 'Eugen Roth', 'obj_surface': 'Munich', 'masked_sentence': 'Eugen Roth (January 24, 1895 in Munich – April 28, 1976 in [MASK]) was a German lyricist and poet who wrote mostly humorous verse.'}]"


In [6]:
def extract_text(evidences):
  """Collect the "masked_sentence" of each evidence entry, in input order.

  Duplicated sentences are kept as they appear; an empty input gives [].
  """
  sentences = []
  for item in evidences:
    sentences.append(item["masked_sentence"])
  return sentences

In [7]:
# For every row, gather the masked sentences found in its evidences and store
# that list in a new "text" column.
masked_sentences = concat_data["evidences"].apply(extract_text)
concat_data["text"] = masked_sentences
# Preview with one sentence per row. The exploded frame is only displayed, not
# assigned, so concat_data keeps its list-valued "text" column.
concat_data.explode(column = "text", ignore_index = True)

Unnamed: 0,obj_label,sub_label,evidences,text
0,Alexandra,Allan Peiper,"[{'sub_surface': 'Allan Peiper', 'obj_surface': 'Alexandra, Victoria', 'masked_sentence': 'Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races.'}, {'sub_surface': 'Allan Peiper', 'obj_surface': 'Alexandra, Victoria', 'masked_sentence': 'Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races.'}]","Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races."
1,Alexandra,Allan Peiper,"[{'sub_surface': 'Allan Peiper', 'obj_surface': 'Alexandra, Victoria', 'masked_sentence': 'Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races.'}, {'sub_surface': 'Allan Peiper', 'obj_surface': 'Alexandra, Victoria', 'masked_sentence': 'Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races.'}]","Allan Peiper (born 26 April 1960 in [MASK], Australia) is a former Professional cyclist, who competed in five Tour de France cycle races."
2,Doncaster,Anthony Barber,"[{'sub_surface': 'Anthony Barber', 'obj_surface': 'Doncaster', 'masked_sentence': 'It was won by the Conservative candidate Anthony Barber, who returned after losing his [MASK] constituency in the 1964 General Election.'}]","It was won by the Conservative candidate Anthony Barber, who returned after losing his [MASK] constituency in the 1964 General Election."
3,Scotland,Paul Mounsey,"[{'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scottish', 'masked_sentence': 'NahooToo is the second album by [MASK] musician Paul Mounsey.'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scottish', 'masked_sentence': 'City of Walls is the fourth album by [MASK] musician Paul Mounsey released in 2003 (see 2003 in music).'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scotland', 'masked_sentence': 'Paul Mounsey (born 15 April 1959) is a composer, arranger and producer from [MASK].'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scotland', 'masked_sentence': 'Paul Mounsey (born 15 April 1959) is a composer, arranger and producer from [MASK].'}]",NahooToo is the second album by [MASK] musician Paul Mounsey.
4,Scotland,Paul Mounsey,"[{'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scottish', 'masked_sentence': 'NahooToo is the second album by [MASK] musician Paul Mounsey.'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scottish', 'masked_sentence': 'City of Walls is the fourth album by [MASK] musician Paul Mounsey released in 2003 (see 2003 in music).'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scotland', 'masked_sentence': 'Paul Mounsey (born 15 April 1959) is a composer, arranger and producer from [MASK].'}, {'sub_surface': 'Paul Mounsey', 'obj_surface': 'Scotland', 'masked_sentence': 'Paul Mounsey (born 15 April 1959) is a composer, arranger and producer from [MASK].'}]",City of Walls is the fourth album by [MASK] musician Paul Mounsey released in 2003 (see 2003 in music).
...,...,...,...,...
12908,London,Joseph Chamberlain,"[{'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Its resulting high level of social mobility also fostered a culture of broad-based political radicalism, that under leaders from Thomas Attwood to Joseph Chamberlain was to give it a political influence unparalleled in Britain outside [MASK], and a pivotal role in the development of British democracy.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The conference was convened in [MASK] by Colonial Secretary Joseph Chamberlain in 1897 on the occasion of Diamond Jubilee of Queen Victoria.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Benjamin Scott (1814–1892) served as Chamberlain of the City of [MASK] from 1858 until his death, as well as being a committed social activist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'R. B. 
Prosser was educated at University College School, [MASK] where he was a fellow pupil of Joseph Chamberlain.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The [MASK] School of Tropical Medicine was established here in October 1899, by Sir Patrick Manson with assistance from the British Secretary of State for the Colonies (Joseph Chamberlain).Together with the Hospital for Tropical Diseases they moved to Euston in February 1920.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'It received its name from the Highbury area of [MASK], where Chamberlain lived as a child.'}]","R. B. Prosser was educated at University College School, [MASK] where he was a fellow pupil of Joseph Chamberlain."
12909,London,Joseph Chamberlain,"[{'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Its resulting high level of social mobility also fostered a culture of broad-based political radicalism, that under leaders from Thomas Attwood to Joseph Chamberlain was to give it a political influence unparalleled in Britain outside [MASK], and a pivotal role in the development of British democracy.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The conference was convened in [MASK] by Colonial Secretary Joseph Chamberlain in 1897 on the occasion of Diamond Jubilee of Queen Victoria.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Benjamin Scott (1814–1892) served as Chamberlain of the City of [MASK] from 1858 until his death, as well as being a committed social activist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'R. B. 
Prosser was educated at University College School, [MASK] where he was a fellow pupil of Joseph Chamberlain.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The [MASK] School of Tropical Medicine was established here in October 1899, by Sir Patrick Manson with assistance from the British Secretary of State for the Colonies (Joseph Chamberlain).Together with the Hospital for Tropical Diseases they moved to Euston in February 1920.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'It received its name from the Highbury area of [MASK], where Chamberlain lived as a child.'}]","He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain."
12910,London,Joseph Chamberlain,"[{'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Its resulting high level of social mobility also fostered a culture of broad-based political radicalism, that under leaders from Thomas Attwood to Joseph Chamberlain was to give it a political influence unparalleled in Britain outside [MASK], and a pivotal role in the development of British democracy.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The conference was convened in [MASK] by Colonial Secretary Joseph Chamberlain in 1897 on the occasion of Diamond Jubilee of Queen Victoria.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Benjamin Scott (1814–1892) served as Chamberlain of the City of [MASK] from 1858 until his death, as well as being a committed social activist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'R. B. 
Prosser was educated at University College School, [MASK] where he was a fellow pupil of Joseph Chamberlain.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The [MASK] School of Tropical Medicine was established here in October 1899, by Sir Patrick Manson with assistance from the British Secretary of State for the Colonies (Joseph Chamberlain).Together with the Hospital for Tropical Diseases they moved to Euston in February 1920.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'It received its name from the Highbury area of [MASK], where Chamberlain lived as a child.'}]","He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain."
12911,London,Joseph Chamberlain,"[{'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'At the same time he contested West Islington in [MASK] as a Gladstone Liberal, attempting to unseat Richard Chamberlain, who like his older brother Joseph Chamberlain had deserted the Liberal party rather than vote for the First Irish Home Rule Bill, and was standing as a Liberal Unionist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Its resulting high level of social mobility also fostered a culture of broad-based political radicalism, that under leaders from Thomas Attwood to Joseph Chamberlain was to give it a political influence unparalleled in Britain outside [MASK], and a pivotal role in the development of British democracy.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The conference was convened in [MASK] by Colonial Secretary Joseph Chamberlain in 1897 on the occasion of Diamond Jubilee of Queen Victoria.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'Benjamin Scott (1814–1892) served as Chamberlain of the City of [MASK] from 1858 until his death, as well as being a committed social activist.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'R. B. 
Prosser was educated at University College School, [MASK] where he was a fellow pupil of Joseph Chamberlain.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'He was born in [MASK] to John Sutton Nettlefold who, in 1854, dispatched him to manage the business of Nettlefold and Chamberlain in Birmingham with his brother Edward John and cousin Joseph Chamberlain.'}, {'sub_surface': 'Joseph Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'The [MASK] School of Tropical Medicine was established here in October 1899, by Sir Patrick Manson with assistance from the British Secretary of State for the Colonies (Joseph Chamberlain).Together with the Hospital for Tropical Diseases they moved to Euston in February 1920.'}, {'sub_surface': 'Chamberlain', 'obj_surface': 'London', 'masked_sentence': 'It received its name from the Highbury area of [MASK], where Chamberlain lived as a child.'}]","The [MASK] School of Tropical Medicine was established here in October 1899, by Sir Patrick Manson with assistance from the British Secretary of State for the Colonies (Joseph Chamberlain).Together with the Hospital for Tropical Diseases they moved to Euston in February 1920."


In [8]:
# Distinct location labels, in order of first appearance.
concat_data.obj_label.unique()

array(['Alexandra', 'Doncaster', 'Scotland', 'Toronto', 'Vienna', 'Paris',
       'Yokohama', 'Antwerp', 'Barcelona', 'Rome', 'Guangzhou', 'Lahore',
       'Florence', 'Belfast', 'Budapest', 'Odessa', 'Melbourne', 'Lyon',
       'Halifax', 'Tokyo', 'London', 'Montreal', 'Queensland', 'Sydney',
       'Helsinki', 'Preston', 'Seoul', 'Detroit', 'Bangkok', 'Nebraska',
       'Madrid', 'Constantinople', 'Bristol', 'Glasgow', 'Cebu',
       'Ukraine', 'Houston', 'Lund', 'Milan', 'Tehran', 'Atlanta',
       'Thailand', 'Angeles', 'Staffordshire', 'Salt', 'Shanghai',
       'Berlin', 'Taipei', 'Gothenburg', 'Guangdong', 'Luton', 'Boston',
       'Havana', 'Essex', 'Newmarket', 'Verona', 'Hamilton', 'Auckland',
       'Chicago', 'Brunswick', 'Denver', 'Perth', 'Utrecht', 'Harlem',
       'Granada', 'Strasbourg', 'Copenhagen', 'Siena', 'Amsterdam',
       'Cincinnati', 'Leigh', 'Naples', 'Beirut', 'Manchester',
       'Brighton', 'Bohemia', 'Bremen', 'Kota', 'Stockholm', 'Mumbai',
       'Turin

In [9]:
# Reorder the rows by location label and renumber the index from 0.
concat_data = concat_data.sort_values(by = "obj_label", ignore_index = True)

In [10]:
# Display the current concat_data; its "text" column holds one list of
# sentences per row (see the rendered output of this cell).
concat_data

Unnamed: 0,obj_label,sub_label,evidences,text
0,Adelaide,John Lavington Bonython,"[{'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'Blanche Ada Bray', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'Blanche Ada Bray', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married 
Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'Blanche Ada Bray', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'Blanche Ada Bray', 'obj_surface': 'Adelaide', 'masked_sentence': 'In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908).'}, {'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'His son was named Sir John Lavington Bonython (1875-1960)His grandson was named John Langdon Bonython (1905–1992) Sir John Langdon Bonython KCMG (/bɒˈnaɪθən/; 15 October 1848 – 22 October 1939), editor, newspaper proprietor, philanthropist, Australian politician and journalist, was a Member of the First Australian Parliament, and was editor of the [MASK] daily morning broadsheet, The Advertiser, for 35 years.'}, {'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'Sir John Lavington Bonython (1875–1960) was a prominent public figure in [MASK], known for his work in journalism, business and politics.'}, {'sub_surface': 'John Lavington Bonython', 'obj_surface': 'Adelaide', 'masked_sentence': 'Sir John Lavington Bonython (1875–1960) was a prominent public figure in [MASK], known for his work in journalism, business and politics.'}]","[In 1930 he married Elizabeth 
(Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 January 1907 – 25 September 2008), born in [MASK], the eldest daughter of Adelaide Advertiser editor, and Lord mayor of Adelaide, Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., In 1930 he married Elizabeth (Betty) Hornabrook Bonython (25 
January 1907 – 25 September 2008), born in Adelaide, the eldest daughter of Adelaide Advertiser editor, and Lord mayor of [MASK], Sir John Lavington Bonython (1875–1960) and his first wife Blanche Ada Bray (1881–1908)., His son was named Sir John Lavington Bonython (1875-1960)His grandson was named John Langdon Bonython (1905–1992) Sir John Langdon Bonython KCMG (/bɒˈnaɪθən/; 15 October 1848 – 22 October 1939), editor, newspaper proprietor, philanthropist, Australian politician and journalist, was a Member of the First Australian Parliament, and was editor of the [MASK] daily morning broadsheet, The Advertiser, for 35 years., Sir John Lavington Bonython (1875–1960) was a prominent public figure in [MASK], known for his work in journalism, business and politics., Sir John Lavington Bonython (1875–1960) was a prominent public figure in [MASK], known for his work in journalism, business and politics.]"
1,Adelaide,Tony Vidmar,"[{'sub_surface': 'Tony Vidmar', 'obj_surface': 'Adelaide', 'masked_sentence': 'Former [MASK] player Richie Alagich, along with Michael Barnett and former Socceroos Tony Vidmar and Joe Mullen joined the coaching staff of these teams.'}]","[Former [MASK] player Richie Alagich, along with Michael Barnett and former Socceroos Tony Vidmar and Joe Mullen joined the coaching staff of these teams.]"
2,Adelaide,Cory Bernardi,"[{'sub_surface': 'Cory Bernardi', 'obj_surface': 'Adelaide', 'masked_sentence': 'Cory Bernardi (born 6 November 1969, [MASK]) is an Australian politician and the author of The Conservative Revolution.'}, {'sub_surface': 'Cory Bernardi', 'obj_surface': 'Adelaide', 'masked_sentence': 'Cory Bernardi (born 6 November 1969, [MASK]) is an Australian politician and the author of The Conservative Revolution.'}]","[Cory Bernardi (born 6 November 1969, [MASK]) is an Australian politician and the author of The Conservative Revolution., Cory Bernardi (born 6 November 1969, [MASK]) is an Australian politician and the author of The Conservative Revolution.]"
3,Adelaide,John McConnell Black,"[{'sub_surface': 'J.M.Black', 'obj_surface': 'Adelaide', 'masked_sentence': 'J.M.Black received the following distinctions for his botanical work:- 1927, Honorary Lecturer in Systematic Botany at the University of [MASK]; 1930, Associate honoris causa of the Linnean Society, London; 1930, Sir Joseph Verco Medal of the Royal Society of South Australia; 1932 Ferdinand von Mueller Medal (Australian and New Zealand Association for the Advancement of Science; 1933-34, President of the Royal Society of South Australia; in 1942, the M.B.E.'}, {'sub_surface': 'J.M.Black', 'obj_surface': 'Adelaide', 'masked_sentence': 'J.M.Black received the following distinctions for his botanical work:- 1927, Honorary Lecturer in Systematic Botany at the University of [MASK]; 1930, Associate honoris causa of the Linnean Society, London; 1930, Sir Joseph Verco Medal of the Royal Society of South Australia; 1932 Ferdinand von Mueller Medal (Australian and New Zealand Association for the Advancement of Science; 1933-34, President of the Royal Society of South Australia; in 1942, the M.B.E.'}]","[J.M.Black received the following distinctions for his botanical work:- 1927, Honorary Lecturer in Systematic Botany at the University of [MASK]; 1930, Associate honoris causa of the Linnean Society, London; 1930, Sir Joseph Verco Medal of the Royal Society of South Australia; 1932 Ferdinand von Mueller Medal (Australian and New Zealand Association for the Advancement of Science; 1933-34, President of the Royal Society of South Australia; in 1942, the M.B.E., J.M.Black received the following distinctions for his botanical work:- 1927, Honorary Lecturer in Systematic Botany at the University of [MASK]; 1930, Associate honoris causa of the Linnean Society, London; 1930, Sir Joseph Verco Medal of the Royal Society of South Australia; 1932 Ferdinand von Mueller Medal (Australian and New Zealand Association for the Advancement of Science; 1933-34, President of the Royal 
Society of South Australia; in 1942, the M.B.E.]"
4,Afghanistan,Nashenas,"[{'sub_surface': 'Nashenas', 'obj_surface': 'Afghanistan', 'masked_sentence': 'Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from [MASK].'}, {'sub_surface': 'Nashenas', 'obj_surface': 'Afghanistan', 'masked_sentence': 'Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from [MASK].'}]","[Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from [MASK]., Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from [MASK].]"
...,...,...,...,...
3812,Zagreb,Boris Papandopulo,"[{'sub_surface': 'Boris Papandopulo', 'obj_surface': 'Zagreb', 'masked_sentence': 'Boris Papandopulo (Honnef am Rhein, February 25, 1906 – [MASK], October 16, 1991), Croatian composer and conductor of Russian Jewish descent.'}, {'sub_surface': 'Boris Papandopulo', 'obj_surface': 'Zagreb', 'masked_sentence': 'Boris Papandopulo (Honnef am Rhein, February 25, 1906 – [MASK], October 16, 1991), Croatian composer and conductor of Russian Jewish descent.'}]","[Boris Papandopulo (Honnef am Rhein, February 25, 1906 – [MASK], October 16, 1991), Croatian composer and conductor of Russian Jewish descent., Boris Papandopulo (Honnef am Rhein, February 25, 1906 – [MASK], October 16, 1991), Croatian composer and conductor of Russian Jewish descent.]"
3813,Zagreb,Edmund Glaise-Horstenau,"[{'sub_surface': 'Edmund Glaise von Horstenau', 'obj_surface': 'Agram', 'masked_sentence': 'In 1941 he was saved by deportation by the Independent State of Croatia, through his friend Edmund Glaise von Horstenau, the Deutscher kommandierender General in [MASK].'}]","[In 1941 he was saved by deportation by the Independent State of Croatia, through his friend Edmund Glaise von Horstenau, the Deutscher kommandierender General in [MASK].]"
3814,Zagreb,Miko Tripalo,"[{'sub_surface': 'Miko Tripalo', 'obj_surface': 'Zagreb', 'masked_sentence': 'Miko Tripalo (Sinj, 1926 – [MASK], 1995) was a Croatian and Yugoslav politician.'}, {'sub_surface': 'Miko Tripalo', 'obj_surface': 'Zagreb', 'masked_sentence': 'Miko Tripalo (Sinj, 1926 – [MASK], 1995) was a Croatian and Yugoslav politician.'}]","[Miko Tripalo (Sinj, 1926 – [MASK], 1995) was a Croatian and Yugoslav politician., Miko Tripalo (Sinj, 1926 – [MASK], 1995) was a Croatian and Yugoslav politician.]"
3815,Zimbabwe,Patrick Chinamasa,"[{'sub_surface': 'Chinamasa', 'obj_surface': 'Zimbabwe', 'masked_sentence': 'Patrick Antony Chinamasa is a Zimbabwean politician who has served in the government of [MASK] as Minister of Finance since 2013.'}, {'sub_surface': 'Chinamasa', 'obj_surface': 'Zimbabwe', 'masked_sentence': 'Patrick Antony Chinamasa is a Zimbabwean politician who has served in the government of [MASK] as Minister of Finance since 2013.'}]","[Patrick Antony Chinamasa is a Zimbabwean politician who has served in the government of [MASK] as Minister of Finance since 2013., Patrick Antony Chinamasa is a Zimbabwean politician who has served in the government of [MASK] as Minister of Finance since 2013.]"


In [11]:
# Give every sentence held in a row's "text" list its own row and renumber the index from 0.
concat_data = concat_data.explode(column="text", ignore_index=True)

We will process the dataset with these steps:
- Remove rows whose "obj_label" is not capitalized (i.e. not a city/country name)
- Remove the "evidences" and "sub_label" columns
- Remove duplicated sentences in "text"
- Drop rows with missing values, keep only sentences that end with "[MASK].", and strip the mask token from them
- Build two columns called "text" and "texts" ("text" contains the first sentence of every "obj_label" and "texts" includes all of its corresponding sentences)

In [12]:
# Keep only the rows whose label begins with an upper-case character.
starts_with_capital = concat_data["obj_label"].str[0].str.isupper()
concat_data = concat_data[starts_with_capital]

In [13]:
# Discard the raw evidence dicts and the subject name; they are not used from here on.
concat_data = concat_data.drop(["evidences", "sub_label"], axis=1)

In [14]:
# Keep the first occurrence of every sentence and drop later repeats.
is_repeat = concat_data.duplicated(subset=["text"])
concat_data = concat_data[~is_repeat]

In [15]:
# Remove every row that has a missing value in any column.
concat_data = concat_data.dropna(axis=0, how="any")

In [16]:
# Keep only sentences in which the mask is the very last token before the final period.
ends_with_mask = concat_data["text"].str.endswith("[MASK].", na=False)
concat_data = concat_data[ends_with_mask]

In [17]:
# Preview the remaining (obj_label, text) rows after the filtering steps above.
concat_data

Unnamed: 0,obj_label,text
16,Afghanistan,"Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from [MASK]."
18,Afghanistan,Abdul Malik Pahlawan is an Uzbek politician based in Faryab Province in northern [MASK].
27,Afghanistan,This garden was built by Maharajah Ranjit Singh in 1813 to celebrate the capture of the famous Koh-i-Noor Diamond from Shah Shujah of [MASK].
29,Afghanistan,"His father was a Qazi in the city of Qandahar, as well as being a some-time minister during the reign of Shah Shujah Durrani (1785-1842), King of [MASK]."
32,Ajax,"Tyler Williams (born February 25, 1988), professionally known as T-Minus, is a Canadian hip-hop and R&B producer from [MASK]."
...,...,...
12722,Windsor,"Williams married in 1812 Delia Ellsworth, daughter of Founding Father Oliver Ellsworth of [MASK]."
12726,Winnipeg,"Although Hasselfield had never run for provincial office, she was known in Manitoba as a prominent organizer for the Liberal Party and was supported by the party's establishment against Kevin Lamoureux, a maverick MLA from north-end [MASK]."
12732,Wisconsin,"Diane Hendricks (born 1947) is an American businesswoman, film producer and philanthropist from [MASK]."
12738,Wolverhampton,"She married, in November 1930, Geoffrey Mander MP for East [MASK]."


In [18]:
# List the distinct labels that survived the filters.
concat_data["obj_label"].unique()

array(['Afghanistan', 'Ajax', 'Albania', 'Algeria', 'Amherst',
       'Amsterdam', 'Angola', 'Antwerp', 'Argentina', 'Armagh', 'Armenia',
       'Athens', 'Atlanta', 'Auckland', 'Augsburg', 'Australia',
       'Austria', 'Baghdad', 'Baku', 'Baltimore', 'Bangkok', 'Bangladesh',
       'Barcelona', 'Bari', 'Basel', 'Beijing', 'Beirut', 'Belgium',
       'Bend', 'Berlin', 'Bern', 'Bhutan', 'Bihar', 'Birmingham',
       'Bohemia', 'Bolivia', 'Bologna', 'Bolton', 'Bonn', 'Boston',
       'Brazil', 'Bremen', 'Brooklyn', 'Bucharest', 'Bulgaria', 'Cairo',
       'Calgary', 'California', 'Cambodia', 'Cambridge', 'Camden',
       'Canada', 'Canterbury', 'Cebu', 'Chester', 'Chicago', 'Chile',
       'Cincinnati', 'Cleveland', 'Colchester', 'Cologne', 'Colombia',
       'Constantinople', 'Copenhagen', 'Dallas', 'Denmark', 'Denver',
       'Derby', 'Detroit', 'Dresden', 'Dubai', 'Dublin', 'Edinburgh',
       'Egypt', 'England', 'Ethiopia', 'Exeter', 'Fiji', 'Finland',
       'Florence', 'Florida', 

In [19]:
# Strip the "[MASK]" placeholder (and a directly following period, if any) from
# every sentence; whitespace that preceded the mask is left in place.
# `assign` builds a new frame instead of writing a column into the filtered
# `concat_data`, which avoids pandas' SettingWithCopyWarning.
concat_data = concat_data.assign(
    text=concat_data["text"].str.replace(r"\[MASK\]\.?", "", regex=True)
)

In [20]:
# Preview the sentences again now that the mask token has been stripped.
concat_data

Unnamed: 0,obj_label,text
16,Afghanistan,"Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from"
18,Afghanistan,Abdul Malik Pahlawan is an Uzbek politician based in Faryab Province in northern
27,Afghanistan,This garden was built by Maharajah Ranjit Singh in 1813 to celebrate the capture of the famous Koh-i-Noor Diamond from Shah Shujah of
29,Afghanistan,"His father was a Qazi in the city of Qandahar, as well as being a some-time minister during the reign of Shah Shujah Durrani (1785-1842), King of"
32,Ajax,"Tyler Williams (born February 25, 1988), professionally known as T-Minus, is a Canadian hip-hop and R&B producer from"
...,...,...
12722,Windsor,"Williams married in 1812 Delia Ellsworth, daughter of Founding Father Oliver Ellsworth of"
12726,Winnipeg,"Although Hasselfield had never run for provincial office, she was known in Manitoba as a prominent organizer for the Liberal Party and was supported by the party's establishment against Kevin Lamoureux, a maverick MLA from north-end"
12732,Wisconsin,"Diane Hendricks (born 1947) is an American businesswoman, film producer and philanthropist from"
12738,Wolverhampton,"She married, in November 1930, Geoffrey Mander MP for East"


In [21]:
# Collapse to one row per label:
#   text  - the first sentence of the group
#   texts - every sentence of the group as a plain Python list
# The built-in "first" / `list` aggregations replace the earlier lambdas, whose
# `str(...)` casts and `x[0:]` slice did nothing on a column of strings.
data = concat_data.groupby("obj_label").agg(
    text=("text", "first"),
    texts=("text", list),
).reset_index()

In [22]:
# Rename the label column to "location". The result is rebound rather than
# mutated with `inplace=True`, so the cell reads as a plain transformation.
data = data.rename(columns={'obj_label': 'location'})

In [24]:
import ast


def _parse_if_str(value):
    """Return `value` parsed by `ast.literal_eval` when it is a string, otherwise unchanged."""
    return ast.literal_eval(value) if isinstance(value, str) else value


# Force the two scalar columns to `str`.
data = data.astype({"text": str, "location": str})
# Cells of `texts` that are strings are parsed back into Python objects;
# cells that are already lists pass through untouched.
data["texts"] = data["texts"].apply(_parse_if_str)

In [27]:
# Spot-check the first rows of both sentence columns.
for column in ("text", "texts"):
    print(data[column].head())
# Check type of a single value
print(type(data["texts"][0]))

0                                                                                                  Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from 
1                                                                                                                   Tyler Williams (born February 25, 1988), professionally known as T-Minus, is a Canadian hip-hop and R&B producer from 
2                                                                                                   Together with Hekuran Isai , Pali Miska, and Qirjako Mihali he was one of the new generation of leaders within the Party of Labour of 
3    Noumérat – Moufdi Zakaria Airport (French: Aéroport de Ghardaïa / Noumérat – Moufdi Zakaria) (IATA: GHA, ICAO: DAUG), also known as Noumerate Airport, is a public airport serving Ghardaïa, the capital of the Ghardaïa Province in 
4                                                           

In [28]:
# Summarise the row count, column dtypes and non-null counts of the aggregated frame.
data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 250 entries, 0 to 249
Data columns (total 3 columns):
 #   Column    Non-Null Count  Dtype 
---  ------    --------------  ----- 
 0   location  250 non-null    object
 1   text      250 non-null    object
 2   texts     250 non-null    object
dtypes: object(3)
memory usage: 6.0+ KB


In [29]:
# Display the final table (location, text, texts).
data

Unnamed: 0,location,text,texts
0,Afghanistan,"Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from","[Nashenas (Pashto/Dari: ناشناس), born as Sadiq Fitrat Habibi, (Pashto/Persian: صادق فطرت) is one of the oldest surviving musicians from , Abdul Malik Pahlawan is an Uzbek politician based in Faryab Province in northern , This garden was built by Maharajah Ranjit Singh in 1813 to celebrate the capture of the famous Koh-i-Noor Diamond from Shah Shujah of , His father was a Qazi in the city of Qandahar, as well as being a some-time minister during the reign of Shah Shujah Durrani (1785-1842), King of ]"
1,Ajax,"Tyler Williams (born February 25, 1988), professionally known as T-Minus, is a Canadian hip-hop and R&B producer from","[Tyler Williams (born February 25, 1988), professionally known as T-Minus, is a Canadian hip-hop and R&B producer from ]"
2,Albania,"Together with Hekuran Isai , Pali Miska, and Qirjako Mihali he was one of the new generation of leaders within the Party of Labour of","[Together with Hekuran Isai , Pali Miska, and Qirjako Mihali he was one of the new generation of leaders within the Party of Labour of , Gjin Aleksi's Mosque (Albanian: Xhamia e Gjin Aleksit) is a 15th century mosque in the village of Rusan, near Delvinë, , he emphasized that Djemo was in fact Albanian nobleman Gjin Muzaki because he assumed that Serbian epic poetry about struggle between Marko Kraljević and Djemo the Mountaneer was based on real struggles between Prince Marko and Muzaka family from ]"
3,Algeria,"Noumérat – Moufdi Zakaria Airport (French: Aéroport de Ghardaïa / Noumérat – Moufdi Zakaria) (IATA: GHA, ICAO: DAUG), also known as Noumerate Airport, is a public airport serving Ghardaïa, the capital of the Ghardaïa Province in","[Noumérat – Moufdi Zakaria Airport (French: Aéroport de Ghardaïa / Noumérat – Moufdi Zakaria) (IATA: GHA, ICAO: DAUG), also known as Noumerate Airport, is a public airport serving Ghardaïa, the capital of the Ghardaïa Province in , Rabah Bitat Airport (IATA: AAE, ICAO: DABB), formerly known as Les Salines Airport, and popularly as El Mellah Airport is an international airport located 9 km south of Annaba, a city in ]"
4,Amherst,"Joseph Charles Bequaert was an American naturalist of Belgian origin, born 24 May 1886 in Torhout (Belgium) and died on 12 January 1982 in","[Joseph Charles Bequaert was an American naturalist of Belgian origin, born 24 May 1886 in Torhout (Belgium) and died on 12 January 1982 in ]"
...,...,...,...
245,Windsor,"Williams married in 1812 Delia Ellsworth, daughter of Founding Father Oliver Ellsworth of","[Williams married in 1812 Delia Ellsworth, daughter of Founding Father Oliver Ellsworth of ]"
246,Winnipeg,"Although Hasselfield had never run for provincial office, she was known in Manitoba as a prominent organizer for the Liberal Party and was supported by the party's establishment against Kevin Lamoureux, a maverick MLA from north-end","[Although Hasselfield had never run for provincial office, she was known in Manitoba as a prominent organizer for the Liberal Party and was supported by the party's establishment against Kevin Lamoureux, a maverick MLA from north-end ]"
247,Wisconsin,"Diane Hendricks (born 1947) is an American businesswoman, film producer and philanthropist from","[Diane Hendricks (born 1947) is an American businesswoman, film producer and philanthropist from ]"
248,Wolverhampton,"She married, in November 1930, Geoffrey Mander MP for East","[She married, in November 1930, Geoffrey Mander MP for East ]"


In [30]:
# Write the table to `geo_path` as CSV, leaving out the integer row index.
data.to_csv(path_or_buf=geo_path, index=False)

# Confirm where the file was written.
print(f"File saved to {geo_path}")

File saved to geodata.csv


In [31]:
# Download the CSV file through the browser when running on Google Colab.
# Outside Colab the `google.colab` package is not importable, so report where
# the file is instead of failing the whole notebook run.
try:
    from google.colab import files
except ImportError:
    print(f"google.colab is not available; {geo_path} was left in the working directory.")
else:
    files.download(geo_path)

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>