In [1]:
import os
from IPython.display import display, HTML

import numpy as np
import pandas as pd

# Investigating claims on performance made in the paper
LLMs perform worse on the proposed TempTabQA dataset than humans. The authors split data into a head and tail set, i.e., into more common and less common domains. Of all LLMs, GPT performs the best. Transforming tables to knowledge graphs improves performance further.

Key claims I want to investigate are:
- LLMs perform better on the head set than on the tail set. Human performance is roughly similar on both.
- _How many_ questions are the hardest for humans. _Who_ questions are the hardest for LLMs.
- LLMs and humans struggle with _summation_, _difference_, and _comparison_ questions.
- Explicit time-related questions are harder than implicit questions.
- Money- and person-related tail questions are hard for both LLMs and humans.

## Inspect training, head, and tail datasets
In the following, I start by inspecting the training data. Later, I look into the head and tail datasets, where the head set is supposed to cover more common domains and the tail set is supposed to cover less common domains.

### Training data

In [2]:
# Training QA pairs; the first CSV column is used as the row index.
df_train = pd.read_csv("../../data/maindata/qapairs/train-set/train-set.csv", index_col=0)

In [3]:
# Peek at the first rows to see which columns are available.
df_train.head()

Unnamed: 0,question,answer,category,table_id
0,How many years prior to Davis's death did she ...,57,actor,4
1,How much longer was Davis married to Gary Merr...,7 years,actor,4
2,How long after Davis career began did she take...,6,actor,4
3,Who was Bette Davis married to in 1942?,Arthur Farnsworth,actor,4
4,When was the first time that Bette Davis becam...,1943,actor,4


In [4]:
# Distinct category labels in the training set, in order of first appearance.
df_train["category"].unique()

array(['actor', 'swimming', 'wrestling', 'empire', 'legislature',
       'footballer', 'tennis', 'golf', 'rugby', 'nba', 'volleyball',
       'emperor', 'badminton', 'tabletennis', 'album', 'civil war',
       'conference', 'aircraft', 'economy', 'court', 'racing',
       'car driver', 'curling', 'nobel', 'painter', 'scientist', 'person',
       'body builder', 'christian leader', 'musician', 'baseball',
       'lacrosse', 'country', 'space probe', 'railway', 'football',
       'handball', 'athelete', 'martial artist', 'nfl', 'ice hockey',
       'basketball', 'company', 'website', 'university', 'stadium',
       'launchpad', 'sailor', 'book', 'skier', 'church', 'monument',
       'figure skating', 'office holder', 'song', 'concert', 'painting',
       'military conflict', 'war/conflict', 'current war', 'earthquake',
       'space program', 'music', 'character', 'movie', 'show',
       'rail line', 'agency', 'national cricket team', 'board game',
       'game', 'national football team'

In [5]:
# (rows, columns) of the training set before any de-duplication.
df_train.shape

(7680, 4)

In [6]:
# Shape after collapsing rows that repeat the same question/answer pair.
df_train.drop_duplicates(subset=["question", "answer"]).shape

(7299, 4)

In [7]:
def remove_persons_and_duplicates(df: pd.DataFrame, keep_categories=None) -> pd.DataFrame:
    """Drop repeated question/answer pairs and keep only selected categories.

    Rows are first de-duplicated on the ``("question", "answer")`` pair
    (the first occurrence is kept), then filtered to the rows whose
    ``category`` is in ``keep_categories``.

    Parameters
    ----------
    df : pd.DataFrame
        Frame with at least the columns ``question``, ``answer`` and
        ``category``. It is not modified.
    keep_categories : iterable of str, optional
        Category labels to retain. When omitted, the hand-curated list that
        was previously hard-coded in this function is used.

    Returns
    -------
    pd.DataFrame
        A new frame holding the surviving rows with their original index.

    Notes
    -----
    The filter is an allow-list: any category that is not listed is dropped,
    including categories that only occur in other data splits. Pass
    ``keep_categories`` explicitly when a split contains additional
    categories that should survive.
    """
    if keep_categories is None:
        # Default allow-list, unchanged from the original implementation.
        keep_categories = (
            "empire", "legislature", "emperor", "album", "civil war",
            "conference", "aircraft", "economy", "court", "nobel", "country",
            "space probe", "railway", "company", "website", "university",
            "stadium", "launchpad", "book", "church", "monument",
            "office holder", "song", "concert", "painting",
            "military conflict", "war/conflict", "current war", "earthquake",
            "space program", "music", "character", "movie", "show",
            "rail line", "agency", "board game", "game",
        )

    deduplicated = df.drop_duplicates(subset=["question", "answer"])
    # A plain boolean mask avoids evaluating a long string expression via query().
    return deduplicated.loc[deduplicated["category"].isin(list(keep_categories))]

In [8]:
# De-duplicated training questions restricted to the allow-listed categories.
df_without_persons = remove_persons_and_duplicates(df_train)

In [9]:
# One example question per remaining category. Seeded with the same
# random_state used for the other samples in this notebook so that the
# displayed rows are reproducible across kernel restarts.
df_without_persons.groupby("category").sample(1, random_state=94)

Unnamed: 0,question,answer,category,table_id
7213,How many total child agencies are there in all...,69,agency,1140
1190,What was the first year that pilots were able ...,1913,aircraft,225
6256,How many singles were released on the Death Ma...,3,album,950
7257,How many years were between when FASA was firs...,23,board game,1150
4467,In what year did Animal Farm get published?,1945,book,701
6982,What year did Lassie release on CBS?,1954,character,1076
4594,What is the Length of All Saints’ Church?,120 feet (37 m),church,722
6512,Who was the leader of UK after 2 years of Mala...,Clement Attlee,civil war,996
3877,In what year was DollarTree founded?,1986,company,602
6815,When did the Beautiful Trauma World Tour start?,"March 1, 2018",concert,1053


### Head test set

In [12]:
# Head test set; the first CSV column is used as the row index.
df_head = pd.read_csv("../../data/maindata/qapairs/head-set/head-set.csv", index_col=0)
df_head.head()

Unnamed: 0,question,answer,category,table_id
0,How many years did Art Carney as actor since 1...,54 Years,actor,2
1,Who was the spouse of Art Carney in 1970?,Barbara Isaac,actor,2
2,How many total years was Art Carney married to...,28 years,actor,2
3,Which spouse was Art Carney married to the least?,Barbara Isaac,actor,2
4,Who was Art Carney married to when he served i...,Jean Myers,actor,2


In [13]:
# (rows, columns) of the head test set.
df_head.shape

(1851, 4)

In [14]:
# Same de-duplication and category filter as applied to the training data.
df_head_without_persons = remove_persons_and_duplicates(df_head)

In [15]:
# One example question per remaining head-set category. Seeded with the same
# random_state used for the other samples in this notebook so that the
# displayed rows are reproducible across kernel restarts.
df_head_without_persons.groupby("category").sample(1, random_state=94)

Unnamed: 0,question,answer,category,table_id
1719,Which year formed in Coordination Center for E...,1937,agency,1139
243,How many years did B-24 Skua was in active ser...,3 Years,aircraft,226
1390,How many labels issued Confessions of a Danger...,two,album,948
1784,When was the first edition of Atlantis released?,1984,board game,1163
1351,How long was Dick King-Smith married to his s...,10 years,book,929
1661,What was the last year the Monks was portrayed...,2007,character,1104
1108,When Valen kapell was closed?,1873-1949,church,715
1413,How many years did Libya supported to Ethiopia...,8 Years,civil war,979
893,Is there more or less employess at AT&T in 202...,less,company,597
1526,How many shows was showed in Europe and Austra...,29,concert,1054


In [16]:
# Categories that occur in the training set but never in the head set.
diff_cat_train_head = np.setdiff1d(
    df_train["category"].unique(),
    df_head["category"].unique(),
)
diff_cat_train_head

array(['conference', 'football', 'painting', 'war/conflict'], dtype=object)

In [17]:
# Categories that occur in the head set but never in the training set.
diff_cat_head_train = np.setdiff1d(
    df_head["category"].unique(),
    df_train["category"].unique(),
)
diff_cat_head_train

array(['event', 'fighter', 'navy vessel', 'politician'], dtype=object)

### Tail test set

In [19]:
# Tail test set; the first CSV column is used as the row index.
df_tail = pd.read_csv("../../data/maindata/qapairs/tail-set/tail-set.csv", index_col=0)
df_tail.head()

Unnamed: 0,question,answer,category,table_id
0,What was the age when Jenson Button best finis...,Age of 38,f1,0
1,What was Jenson Button's age when he won the S...,38,f1,0
2,How long did it take Jenson Button to win his ...,9 years,f1,0
3,Where did Jenson Button compete 5 years before...,Brazil,f1,0
4,For how many years did Jenson Button's profess...,17 years,f1,0


In [20]:
# Distinct category labels in the tail set, in order of first appearance.
df_tail["category"].unique()

array(['f1', 'time zone', 'hockey', 'cricket', 'cycling', 'squash',
       'sumo', 'political party', 'sports event', 'holiday', 'ship',
       'orbitor', 'boxing', 'terrorist orgnization', 'cyclone',
       'proxy war', 'army', 'planet', 'disease'], dtype=object)

In [21]:
# One example question per tail-set category. Seeded with the same
# random_state used for the other samples in this notebook so that the
# displayed rows are reproducible across kernel restarts.
df_tail.groupby("category").sample(1, random_state=94)

Unnamed: 0,question,answer,category,table_id
959,How many years did First Lebanon War was held ...,3 Years,army,1119
552,How much longer did Yamamoto play for Kamatama...,3 years,boxing,484
615,How old was Brian Lara when he joined West Ind...,21,cricket,528
101,What team did Valverde ride for the year he wo...,Kelme–Costa Blanca,cycling,99
740,How strong was Hurricane Ivan?,Category 5 Hurricane (SSHWS),cyclone,958
1030,How much time elapsed between the first report...,14 days.,disease,1205
34,How many years are between Barrichello's best ...,2,f1,51
661,How old was Lombi when won gold at the Pan Ame...,24,hockey,680
436,How many days later does Mardi Gras start in 2...,5 days,holiday,218
547,How many month left did ExoMars was planned in...,9 months left,orbitor,461


In [22]:
# Training rows whose category also appears in the tail set.
df_train.loc[df_train["category"].isin(df_tail["category"].unique())]

Unnamed: 0,question,answer,category,table_id


In [23]:
# Head-set rows whose category also appears in the tail set.
df_head.loc[df_head["category"].isin(df_tail["category"].unique())]

Unnamed: 0,question,answer,category,table_id


In [24]:
# Drop rows that are identical in every column (note: this rebinds df_tail).
df_tail = df_tail.drop_duplicates()
# The same question text can still occur more than once, e.g. when the answer
# wording, the category or the table_id differs between rows.
df_tail[df_tail["question"].duplicated(keep=False)]

Unnamed: 0,question,answer,category,table_id
198,How old was Tarek Momen when he turned pro?,17,squash,110
202,How old was Tarek Momen when he turned pro?,17 years old,squash,110
219,How old was Futabayama Sadaji when he retired?,33 years old,sumo,134
222,How old was Futabayama Sadaji when he retired?,33,sumo,134
270,How old was Aminishiki Ryūji when he made his ...,19 years old,sumo,180
275,How old was Aminishiki Ryūji when he made his ...,19,sumo,180
279,How many total years (terms) does Joe Biden ho...,6 years (2 terms),political party,182
280,What positions did Joe Biden hold in 2008?,"The United States Senator from Delaware, Chair...",political party,182
287,Who was Joe Biden married to when he was first...,Unmarried,political party,182
293,What positions did Joe Biden hold in 2008?,"The United States Senator from Delaware, Chair...",political party,183


In [25]:
# Duplicates due to 1:n relationship between question and category, and question and table_id
df_tail[
    df_tail.duplicated(subset=["question", "answer", "category"], keep=False)
].sort_values(by="question")

Unnamed: 0,question,answer,category,table_id
937,At what age does Joe Biden join the democratic...,27,army,1118
923,At what age does Joe Biden join the democratic...,27,army,1116
862,At what age does Joe Biden join the democratic...,27,cyclone,1091
732,At what age does Joe Biden join the democratic...,27,cyclone,958
279,How many total years (terms) does Joe Biden ho...,6 years (2 terms),political party,182
297,How many total years (terms) does Joe Biden ho...,6 years (2 terms),political party,184
965,How many years after the second marriage did J...,44 years,army,1120
957,How many years after the second marriage did J...,44 years,army,1119
947,How many years after the second marriage did J...,44 years,army,1118
293,What positions did Joe Biden hold in 2008?,"The United States Senator from Delaware, Chair...",political party,183


In [26]:
# Duplicates due to different answers per question
df_tail[df_tail.duplicated(subset=["question", "table_id"], keep=False)].sort_values(
    by="question"
)

Unnamed: 0,question,answer,category,table_id
270,How old was Aminishiki Ryūji when he made his ...,19 years old,sumo,180
275,How old was Aminishiki Ryūji when he made his ...,19,sumo,180
219,How old was Futabayama Sadaji when he retired?,33 years old,sumo,134
222,How old was Futabayama Sadaji when he retired?,33,sumo,134
198,How old was Tarek Momen when he turned pro?,17,squash,110
202,How old was Tarek Momen when he turned pro?,17 years old,squash,110
850,Who was the US senator from Delaware in Dec 1972?,A. J. Caleb Boggs,cyclone,1091
854,Who was the US senator from Delaware in Dec 1972?,J. Caleb Boggs,cyclone,1091


## Inspect the author's data analysis
After running the `dataAnalysis.py` script, I created a .csv file that contains descriptors of the questions in the training set, such as whether a question is implicit or explicit, which temporal operation is required, and so on.

In [27]:
# Per-question descriptors for the training set. `.iloc[:, 2:]` discards the
# first two columns by position — presumably leftover index columns written by
# the export; TODO confirm against the CSV header.
df_analysis = pd.read_csv(
    "../../data/maindata/qapairs/train-set/train-set_analysis.csv"
).iloc[:, 2:]
df_analysis.head()

Unnamed: 0,question,answer,category,table_id,explicit,implicit,before_related,after_related,duration_related,max_operator,min_operator,count_operator,sum_operator,difference_operator,average_operator,comparison_operator,ordinal,answer_type
0,How many years prior to Davis's death did she ...,57,actor,4,True,False,True,False,False,False,False,True,False,False,False,False,False,COUNT
1,How much longer was Davis married to Gary Merr...,7 years,actor,4,False,True,False,False,True,False,False,False,False,False,False,False,False,TEMPORAL
2,How long after Davis career began did she take...,6,actor,4,False,True,False,True,False,False,False,False,False,False,False,False,False,UNKNOWN
3,Who was Bette Davis married to in 1942?,Arthur Farnsworth,actor,4,True,False,False,False,False,False,False,False,False,False,False,False,False,PERSON
4,When was the first time that Bette Davis becam...,1943,actor,4,False,True,False,False,False,False,False,False,False,False,False,False,True,TEMPORAL


In [28]:
# List the descriptor columns available in the analysis file.
df_analysis.columns

Index(['question', 'answer', 'category', 'table_id', 'explicit', 'implicit',
       'before_related', 'after_related', 'duration_related', 'max_operator',
       'min_operator', 'count_operator', 'sum_operator', 'difference_operator',
       'average_operator', 'comparison_operator', 'ordinal', 'answer_type'],
      dtype='object')

In [29]:
# Distinct answer types assigned by the analysis script.
df_analysis["answer_type"].unique()

array(['COUNT', 'TEMPORAL', 'UNKNOWN', 'PERSON', 'AGE', 'PLACE',
       'PERCENTAGE', 'ORDINAL', 'YES/NO', 'ORGANIZATION', 'PRODUCT',
       'MONEY'], dtype=object)

### _How many_ questions are the hardest for humans. _Who_ questions are the hardest for LLMs
Let's investigate what these questions look like and what they have in common.

`dataAnalysis.py` does not produce a _how many_ or _who_ category. Looking at the regexes in the script, both the `count_operator` and the `duration_related` categories match _how many_. For _who_, the only matching regexes are the ones that classify answer types. Therefore, I assume the authors' analysis must have used simple string matching on the question text.

#### Let's start with looking at the GPT 4 prediction for the tail data set. 
We must load both datasets (the tail questions and the GPT-4 predictions), remove duplicates, and find the tail questions by merging them with the GPT-4 answers. Afterwards, we will search for _how many_ and _who_ questions to inspect the data further.

In [30]:
# GPT-4 few-shot-with-reasoning predictions. The file name says "outdomain";
# presumably this is the tail set (the first rows match tail questions) —
# TODO confirm.
df_gpt4 = pd.read_csv(
    "../../models/predictions/gpt4/fewshot_with_reasoning/outdomain_eval_gpt_4_few_shot_with_reasoning_single.csv"
)
df_gpt4.head()

Unnamed: 0,table,predicted_answer,actual_answer,question
0,"<html><body><table class=""infobox biography vc...",Formula One && Five years before his Super GT ...,Brazil,Where did Jenson Button compete 5 years before...
1,"<html><body><table class=""infobox biography vc...",20 years old && Button began his Formula One c...,20,How old was Jenson Button when he began his pr...
2,"<html><body><table class=""infobox biography vc...",United Kingdom && Jenson Button's nationality ...,England,Which country did Jenson Button participated i...
3,"<html><body><table class=""infobox biography vc...",2000 && He first entered the Australian Grand ...,2000,When did Jenson Button first enter into the Au...
4,"<html><body><table class=""infobox biography vc...",10 years ago && Jenson Button last won the Bra...,10 Years ago (2012),How many years ago did Jenson Button last won ...


In [31]:
def inline_render_html(html_str):
    """Wrap an HTML fragment in a thin-bordered, padded ``<div>``.

    The fragment is inserted verbatim (no escaping), so any markup it
    contains is rendered as HTML.
    """
    wrapper = '<div style="border: 1px solid #ddd; padding: 5px;">{}</div>'
    return wrapper.format(html_str)


def html_render_df(df, html_col="table"):
    """Return a Styler that renders the HTML stored in one column inline.

    Parameters
    ----------
    df : pd.DataFrame
        Frame to display; must contain the column named by ``html_col``.
    html_col : str, default "table"
        Name of the column whose cells hold HTML fragments. Each cell is
        wrapped by ``inline_render_html`` and the column is left-aligned.

    Returns
    -------
    pandas Styler
        The styled view of ``df``; display it as the last expression of a cell.
    """
    # Left-align the same column that is formatted. The subset used to be
    # hard-coded to "table", which broke any call with a different html_col.
    return df.style.format({html_col: inline_render_html}).set_properties(
        subset=[html_col], **{"text-align": "left"}
    )


# Render the last prediction row with its HTML table shown inline.
html_render_df(df_gpt4.tail(1))


Unnamed: 0,table,predicted_answer,actual_answer,question
1026,"White House COVID-19 outbreakPresident Donald Trump speaking during the event held to announce Amy Coney Barrett's nomination to the Supreme Court in the White House Rose Garden.DiseaseCOVID-19Virus strainSARS-CoV-2LocationWhite House, Washington, D.C., United StatesFirst reportedOctober 1, 2020Index caseSeptember 30, 2020Arrival dateSeptember 26, 2020; 2 years agoConfirmed casesTotal:At least 53, including President TrumpPre-nomination:At least six as of October 14Nomination:At least 25 as of October 14Pence staff:At least 5 as of November 11Election Day:At least 20 as of November 11Hospitalized casesAt least one, by October 15",President Trump && He was the most noteworthy individual to contract Covid in the White House outbreak.,President Trump,Who was the most noteworthy individual to contract Covid in this?
White House COVID-19 outbreak,White House COVID-19 outbreak,,,
President Donald Trump speaking during the event held to announce Amy Coney Barrett's nomination to the Supreme Court in the White House Rose Garden.,President Donald Trump speaking during the event held to announce Amy Coney Barrett's nomination to the Supreme Court in the White House Rose Garden.,,,
Disease,COVID-19,,,
Virus strain,SARS-CoV-2,,,
Location,"White House, Washington, D.C., United States",,,
First reported,"October 1, 2020",,,
Index case,"September 30, 2020",,,
Arrival date,"September 26, 2020; 2 years ago",,,
Confirmed cases,"Total:At least 53, including President TrumpPre-nomination:At least six as of October 14Nomination:At least 25 as of October 14Pence staff:At least 5 as of November 11Election Day:At least 20 as of November 11",,,

White House COVID-19 outbreak,White House COVID-19 outbreak.1
President Donald Trump speaking during the event held to announce Amy Coney Barrett's nomination to the Supreme Court in the White House Rose Garden.,President Donald Trump speaking during the event held to announce Amy Coney Barrett's nomination to the Supreme Court in the White House Rose Garden.
Disease,COVID-19
Virus strain,SARS-CoV-2
Location,"White House, Washington, D.C., United States"
First reported,"October 1, 2020"
Index case,"September 30, 2020"
Arrival date,"September 26, 2020; 2 years ago"
Confirmed cases,"Total:At least 53, including President TrumpPre-nomination:At least six as of October 14Nomination:At least 25 as of October 14Pence staff:At least 5 as of November 11Election Day:At least 20 as of November 11"
Hospitalized cases,"At least one, by October 15"


In [32]:
# (rows, columns) of the raw GPT-4 predictions.
df_gpt4.shape

(1027, 4)

In [33]:
# Answers are otherwise not easy to check for exact match
df_gpt4 = df_gpt4.assign(
    predicted_answer_short=lambda x: x["predicted_answer"]
    .str.split("&&")
    .str[0]
    .str.strip()
)

In [34]:
# Show three seeded examples where the short prediction equals the reference
# answer exactly.
html_render_df(
    df_gpt4.loc[df_gpt4["predicted_answer_short"] == df_gpt4["actual_answer"]]
    .sample(n=3, random_state=94)[
        ["table", "question", "predicted_answer_short", "actual_answer"]
    ]
)

Unnamed: 0,table,question,predicted_answer_short,actual_answer
85,"Deshabandu Sanath JayasuriyaJayasuriya playing for Sri Lanka in 2008Personal informationFull nameSanath Teran JayasuriyaBorn30 June 1969(age 52) Matara, CeylonNicknameMaster Blaster, Little Dynamite, Matara Hurricane Matara MaulerHeight5 ft 7 in (1.70 m)BattingLeft-handedBowlingSlow left arm orthodoxRoleAll-rounderInternational informationNational sideSri Lanka (1989–2011)Test debut (cap 49)22 February 1991 v New ZealandLast Test1 December 2007 v EnglandODI debut (cap 58)26 December 1989 v AustraliaLast ODI28 June 2011 v EnglandODI shirt no.07T20I debut (cap 4)15 June 2006 v EnglandLast T20I25 June 2011 v EnglandDomestic team informationYearsTeam1994–2011Bloomfield2005Somerset2007Lancashire2008Warwickshire2008–2010Mumbai Indians2010Worcestershire2011Ruhuna Rhinos2012Khulna Royal Bengals2012Kandurata WarriorsCareer statisticsCompetitionTestODIFCT20Matches110445265111Runs scored6,97313,43014,8192,317Batting average40.0732.3638.3922.71100s/50s14/3128/6829/701/12Top score340189340114*Balls bowled8,18814,87415,2751,593Wickets9832320577Bowling average34.3436.7533.2025.755 wickets in innings242010 wickets in match0000Best bowling5/346/295/344/24Catches/stumpings78/0123/0162/021/0Source: ESPNcricinfo,15 April 2021",What was the third team that Sanath Jayasuriya played for?,Lancashire,Lancashire
Jayasuriya playing for Sri Lanka in 2008,Jayasuriya playing for Sri Lanka in 2008,,,
Personal information,Personal information,,,
Full name,Sanath Teran Jayasuriya,,,
Born,"30 June 1969(age 52) Matara, Ceylon",,,
Nickname,"Master Blaster, Little Dynamite, Matara Hurricane Matara Mauler",,,
Height,5 ft 7 in (1.70 m),,,
Batting,Left-handed,,,
Bowling,Slow left arm orthodox,,,
Role,All-rounder,,,

0,1,2,3,4
Jayasuriya playing for Sri Lanka in 2008,Jayasuriya playing for Sri Lanka in 2008,,,
Personal information,Personal information,,,
Full name,Sanath Teran Jayasuriya,,,
Born,"30 June 1969(age 52) Matara, Ceylon",,,
Nickname,"Master Blaster, Little Dynamite, Matara Hurricane Matara Mauler",,,
Height,5 ft 7 in (1.70 m),,,
Batting,Left-handed,,,
Bowling,Slow left arm orthodox,,,
Role,All-rounder,,,
International information,International information,,,

Competition,Test,ODI,FC,T20
Matches,110,445,265,111
Runs scored,6973,13430,14819,2317
Batting average,40.07,32.36,38.39,22.71
100s/50s,14/31,28/68,29/70,1/12
Top score,340,189,340,114*
Balls bowled,8188,14874,15275,1593
Wickets,98,323,205,77
Bowling average,34.34,36.75,33.20,25.75
5 wickets in innings,2,4,2,0
10 wickets in match,0,0,0,0

0,1,2
Coll in 2018,Coll in 2018,
Nickname(s),Superman,
Country,New Zealand,
Residence,"Hoofddorp, Netherlands",
Height,1.79 m (5 ft 10 in),
Weight,83 kg (183 lb),
Turned Pro,2010,
Retired,Active,
Plays,Right Handed,
Coached by,Rob Owen,

0,1,2
,,
Men's squash,Men's squash,Men's squash
RepresentingNew Zealand,RepresentingNew Zealand,RepresentingNew Zealand
World Championships,World Championships,World Championships
,2019–20 Doha,Singles
,2020–21 Chicago,Singles
World Doubles Championships,World Doubles Championships,World Doubles Championships
,2016 Darwin,Mixed doubles
,2017 Manchester,Mixed doubles
,2016 Darwin,Doubles

0,1,2,3,4
Richards in 2005,Richards in 2005,,,
Personal information,Personal information,,,
Full name,Isaac Vivian Alexander Richards,,,
Height,5 ft 10 in (1.78 m),,,
Batting,Right-handed,,,
Bowling,Right-arm slow seam Right-arm off-break,,,
Role,Batsman,,,
International information,International information,,,
National side,West Indies (1974–1991),,,
Test debut (cap 151),22 November 1974 v India,,,

Competition,Test,ODI,FC,LA
Matches,121,187,507,500
Runs scored,8540,6721,36212,16995
Batting average,50.23,47.00,49.40,41.96
100s/50s,24/45,11/45,114/162,26/109
Top score,291,189*,322,189*
Balls bowled,5170,5644,23226,12214
Wickets,32,118,223,290
Bowling average,61.37,35.83,45.15,30.59
5 wickets in innings,0,2,1,3
10 wickets in match,0,0,0,0


In [35]:
# Same view as the previous cell, widened to twenty seeded exact-match examples.
html_render_df(
    df_gpt4.loc[df_gpt4["predicted_answer_short"] == df_gpt4["actual_answer"]]
    .sample(n=20, random_state=94)[
        ["table", "question", "predicted_answer_short", "actual_answer"]
    ]
)

Unnamed: 0,table,question,predicted_answer_short,actual_answer
85,"Deshabandu Sanath JayasuriyaJayasuriya playing for Sri Lanka in 2008Personal informationFull nameSanath Teran JayasuriyaBorn30 June 1969(age 52) Matara, CeylonNicknameMaster Blaster, Little Dynamite, Matara Hurricane Matara MaulerHeight5 ft 7 in (1.70 m)BattingLeft-handedBowlingSlow left arm orthodoxRoleAll-rounderInternational informationNational sideSri Lanka (1989–2011)Test debut (cap 49)22 February 1991 v New ZealandLast Test1 December 2007 v EnglandODI debut (cap 58)26 December 1989 v AustraliaLast ODI28 June 2011 v EnglandODI shirt no.07T20I debut (cap 4)15 June 2006 v EnglandLast T20I25 June 2011 v EnglandDomestic team informationYearsTeam1994–2011Bloomfield2005Somerset2007Lancashire2008Warwickshire2008–2010Mumbai Indians2010Worcestershire2011Ruhuna Rhinos2012Khulna Royal Bengals2012Kandurata WarriorsCareer statisticsCompetitionTestODIFCT20Matches110445265111Runs scored6,97313,43014,8192,317Batting average40.0732.3638.3922.71100s/50s14/3128/6829/701/12Top score340189340114*Balls bowled8,18814,87415,2751,593Wickets9832320577Bowling average34.3436.7533.2025.755 wickets in innings242010 wickets in match0000Best bowling5/346/295/344/24Catches/stumpings78/0123/0162/021/0Source: ESPNcricinfo,15 April 2021",What was the third team that Sanath Jayasuriya played for?,Lancashire,Lancashire
Jayasuriya playing for Sri Lanka in 2008,Jayasuriya playing for Sri Lanka in 2008,,,
Personal information,Personal information,,,
Full name,Sanath Teran Jayasuriya,,,
Born,"30 June 1969(age 52) Matara, Ceylon",,,
Nickname,"Master Blaster, Little Dynamite, Matara Hurricane Matara Mauler",,,
Height,5 ft 7 in (1.70 m),,,
Batting,Left-handed,,,
Bowling,Slow left arm orthodox,,,
Role,All-rounder,,,

0,1,2,3,4
Jayasuriya playing for Sri Lanka in 2008,Jayasuriya playing for Sri Lanka in 2008,,,
Personal information,Personal information,,,
Full name,Sanath Teran Jayasuriya,,,
Born,"30 June 1969(age 52) Matara, Ceylon",,,
Nickname,"Master Blaster, Little Dynamite, Matara Hurricane Matara Mauler",,,
Height,5 ft 7 in (1.70 m),,,
Batting,Left-handed,,,
Bowling,Slow left arm orthodox,,,
Role,All-rounder,,,
International information,International information,,,

Competition,Test,ODI,FC,T20
Matches,110,445,265,111
Runs scored,6973,13430,14819,2317
Batting average,40.07,32.36,38.39,22.71
100s/50s,14/31,28/68,29/70,1/12
Top score,340,189,340,114*
Balls bowled,8188,14874,15275,1593
Wickets,98,323,205,77
Bowling average,34.34,36.75,33.20,25.75
5 wickets in innings,2,4,2,0
10 wickets in match,0,0,0,0

0,1,2
Coll in 2018,Coll in 2018,
Nickname(s),Superman,
Country,New Zealand,
Residence,"Hoofddorp, Netherlands",
Height,1.79 m (5 ft 10 in),
Weight,83 kg (183 lb),
Turned Pro,2010,
Retired,Active,
Plays,Right Handed,
Coached by,Rob Owen,

0,1,2
,,
Men's squash,Men's squash,Men's squash
RepresentingNew Zealand,RepresentingNew Zealand,RepresentingNew Zealand
World Championships,World Championships,World Championships
,2019–20 Doha,Singles
,2020–21 Chicago,Singles
World Doubles Championships,World Doubles Championships,World Doubles Championships
,2016 Darwin,Mixed doubles
,2017 Manchester,Mixed doubles
,2016 Darwin,Doubles

0,1,2,3,4
Richards in 2005,Richards in 2005,,,
Personal information,Personal information,,,
Full name,Isaac Vivian Alexander Richards,,,
Height,5 ft 10 in (1.78 m),,,
Batting,Right-handed,,,
Bowling,Right-arm slow seam Right-arm off-break,,,
Role,Batsman,,,
International information,International information,,,
National side,West Indies (1974–1991),,,
Test debut (cap 151),22 November 1974 v India,,,

Competition,Test,ODI,FC,LA
Matches,121,187,507,500
Runs scored,8540,6721,36212,16995
Batting average,50.23,47.00,49.40,41.96
100s/50s,24/45,11/45,114/162,26/109
Top score,291,189*,322,189*
Balls bowled,5170,5644,23226,12214
Wickets,32,118,223,290
Bowling average,61.37,35.83,45.15,30.59
5 wickets in innings,0,2,1,3
10 wickets in match,0,0,0,0

Personal information,Personal information.1,Personal information.2,Personal information.3
Full name,Shohei Yamamoto,Shohei Yamamoto,Shohei Yamamoto
Date of birth,"August 29, 1982(age 39)","August 29, 1982(age 39)","August 29, 1982(age 39)"
Place of birth,"Nagaokakyo, Kyoto, Japan","Nagaokakyo, Kyoto, Japan","Nagaokakyo, Kyoto, Japan"
Height,1.73 m (5 ft 8 in),1.73 m (5 ft 8 in),1.73 m (5 ft 8 in)
Position(s),Midfielder,Midfielder,Midfielder
Youth career,Youth career,Youth career,Youth career
1995–2000,Kyoto Purple Sanga,Kyoto Purple Sanga,Kyoto Purple Sanga
Senior career*,Senior career*,Senior career*,Senior career*
Years,Team,Apps,(Gls)
2001,Kyoto Purple Sanga,0,(0)

0,1,2,3,4
Tendulkar at a promotional event,Tendulkar at a promotional event,,,
Personal information,Personal information,,,
Full name,Sachin Ramesh Tendulkar,,,
Born,"24 April 1973(age 49) Bombay, Maharashtra, India",,,
Nickname,"Little Master, Master Blaster",,,
Height,165 cm (5 ft 5 in),,,
Batting,Right-handed,,,
Bowling,Right-arm leg break Right-arm off break,,,
Relations,Arjun Tendulkar (son) Ramesh Tendulkar (father),,,
Website,sachintendulkar.com,,,

Competition,Test,ODI,FC,LA
Matches,200,463,310,551
Runs scored,15921,18426,25396,21999
Batting average,53.78,44.83,57.84,45.54
100s/50s,51/68,49/96,81/116,60/114
Top score,248*,200*,248*,200*
Balls bowled,4240,8054,7605,10230
Wickets,46,154,71,201
Bowling average,54.17,44.48,61.74,42.17
5 wickets in innings,0,2,0,2
10 wickets in match,0,0,0,0

0,1,2
Farag at the 2017 Men's World Team Squash Championships,Farag at the 2017 Men's World Team Squash Championships,
Full name,Ali Amr Farag,
Nickname(s),"Mr. Fantastic, Rubber-band Man, The Raptor",
Country,Egypt,
Residence,"Cairo, Egypt",
Born,"22 April 1992(age 30) Cairo, Egypt",
Height,1.83 m (6 ft 0 in),
Turned Pro,2009,
Retired,Active,
Plays,Right handed,

0,1,2
,,
Men's squash,Men's squash,Men's squash
Representing Egypt,Representing Egypt,Representing Egypt
World Championships,World Championships,World Championships
,2017 Manchester,Singles
,2018–19 Chicago,Singles
,2020–21 Chicago,Singles
,2021–22 Cairo,Singles
World Team Championships,World Team Championships,World Team Championships
,2017 Marseille,Team

Insurgency in Laos,Insurgency in Laos.1
Part of the Third Indochina War,Part of the Third Indochina War
Date2 December 1975 – presentLocationSouthern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)StatusOngoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.,Date2 December 1975 – presentLocationSouthern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)StatusOngoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.
Date,2 December 1975 – present
Location,Southern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)
Status,Ongoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.
Belligerents,Belligerents
LaosLao People's Revolutionary PartySupported by: Vietnam (from 1976) North Vietnam (until 1976) Soviet Union (until 1989),Hmong insurgentsSupported by: Thailand (until 1990) United States (until 1990)Neo Hom (1981–2007)Royalists:Lao National Liberation FrontRoyal Lao Democratic Government (1982)Supported by:Royal Lao Government in Exile China (until 1988)Democratic Kampuchea (until 1979)Khmer RougeParty of Democratic Kampuchea (1981–1990)Rightists:United Front for the Liberation of LaosSupported by: Thailand (early to mid–1980s)

0,1
Date,2 December 1975 – present
Location,Southern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)
Status,Ongoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.

0,1
"HMSSomersetin Indian Ocean, 2011","HMSSomersetin Indian Ocean, 2011"
History,History
United Kingdom,United Kingdom
Name,HMSSomerset
Operator,Royal Navy
Ordered,January 1992
Builder,Yarrow Shipbuilders
Laid down,12 October 1992
Launched,25 June 1994
Sponsored by,Lady Layard

Insurgency in Laos,Insurgency in Laos.1
Part of the Third Indochina War,Part of the Third Indochina War
Date2 December 1975 – presentLocationSouthern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)StatusOngoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.,Date2 December 1975 – presentLocationSouthern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)StatusOngoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.
Date,2 December 1975 – present
Location,Southern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)
Status,Ongoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.
Belligerents,Belligerents
LaosLao People's Revolutionary PartySupported by: Vietnam (from 1976) North Vietnam (until 1976) Soviet Union (until 1989),Hmong insurgentsSupported by: Thailand (until 1990) United States (until 1990)Neo Hom (1981–2007)Royalists:Lao National Liberation FrontRoyal Lao Democratic Government (1982)Supported by:Royal Lao Government in Exile China (until 1988)Democratic Kampuchea (until 1979)Khmer RougeParty of Democratic Kampuchea (1981–1990)Rightists:United Front for the Liberation of LaosSupported by: Thailand (early to mid–1980s)

0,1
Date,2 December 1975 – present
Location,Southern Laos (royalists and rightists); Central and Northern Laos (Hmong rebels)
Status,Ongoing low-intensity conflict2007 Hmong-led coup attempt against the Lao government foiled; alleged plotters tried and exonerated in the U.S.

0,1,2,3,4
Richards in 2005,Richards in 2005,,,
Personal information,Personal information,,,
Full name,Isaac Vivian Alexander Richards,,,
Height,5 ft 10 in (1.78 m),,,
Batting,Right-handed,,,
Bowling,Right-arm slow seam Right-arm off-break,,,
Role,Batsman,,,
International information,International information,,,
National side,West Indies (1974–1991),,,
Test debut (cap 151),22 November 1974 v India,,,

Competition,Test,ODI,FC,LA
Matches,121,187,507,500
Runs scored,8540,6721,36212,16995
Batting average,50.23,47.00,49.40,41.96
100s/50s,24/45,11/45,114/162,26/109
Top score,291,189*,322,189*
Balls bowled,5170,5644,23226,12214
Wickets,32,118,223,290
Bowling average,61.37,35.83,45.15,30.59
5 wickets in innings,0,2,1,3
10 wickets in match,0,0,0,0

Women's 100 metre breaststroke at the 2016 FINA World Swimming Championships (25 m),Women's 100 metre breaststroke at the 2016 FINA World Swimming Championships (25 m).1,Unnamed: 2
Venue,WFCU Centre,
Dates,9 December (heats and semifinals) 10 December (final),
Competitors,60 from 46 nations,
Winning time,1:03.03,
Medalists,Medalists,
Alia Atkinson Jamaica Lilly King United States Molly Hannis United States,Alia Atkinson Jamaica Lilly King United States Molly Hannis United States,
,Alia Atkinson,Jamaica
,Lilly King,United States
,Molly Hannis,United States
← 20142018 →,← 20142018 →,

0,1,2
,Alia Atkinson,Jamaica
,Lilly King,United States
,Molly Hannis,United States

0,1
"Scale model ofAchille, sister ship of French ship Tonnerre (1808), on display at the Musée national de la Marine in Paris.","Scale model ofAchille, sister ship of French ship Tonnerre (1808), on display at the Musée national de la Marine in Paris."
History,History
France,France
Name,Tonnerre
Ordered,16 April 1794
Laid down,22 September 1794
Launched,9 June 1808
Commissioned,21 July 1808
Renamed,Quatorze Juillet(1795)
Fate,Burned and exploded 12 April 1809

Haguroyama Masaji,Haguroyama Masaji.1
羽黒山 政司,羽黒山 政司
"Haguroyama, circa 1943","Haguroyama, circa 1943"
Personal information,Personal information
Born,"Kobayashi Masaji November 18, 1914 Nakanokuchi, Japan"
Died,"October 14, 1969(aged 54)"
Height,1.79 m (5 ft10+1⁄2 in)
Weight,129.5 kg (285 lb)
Career,Career
Stable,Tatsunami
Record,359-99-117-1 draw

0,1,2
Farag at the 2017 Men's World Team Squash Championships,Farag at the 2017 Men's World Team Squash Championships,
Full name,Ali Amr Farag,
Nickname(s),"Mr. Fantastic, Rubber-band Man, The Raptor",
Country,Egypt,
Residence,"Cairo, Egypt",
Born,"22 April 1992(age 30) Cairo, Egypt",
Height,1.83 m (6 ft 0 in),
Turned Pro,2009,
Retired,Active,
Plays,Right handed,

0,1,2
,,
Men's squash,Men's squash,Men's squash
Representing Egypt,Representing Egypt,Representing Egypt
World Championships,World Championships,World Championships
,2017 Manchester,Singles
,2018–19 Chicago,Singles
,2020–21 Chicago,Singles
,2021–22 Cairo,Singles
World Team Championships,World Team Championships,World Team Championships
,2017 Marseille,Team

Chadian Civil War (1965–1979),Chadian Civil War (1965–1979).1
French Navy helicopter and French paratroopers during a 1971 operation in Chad,French Navy helicopter and French paratroopers during a 1971 operation in Chad
Date1 November 1965 – November 1979LocationChadResultOverthrow and death of François Tombalbaye in 1975Overthrow of Félix Malloum in 1979Signing of Lagos Accord and installation of Transitional Government of National Unity,Date1 November 1965 – November 1979LocationChadResultOverthrow and death of François Tombalbaye in 1975Overthrow of Félix Malloum in 1979Signing of Lagos Accord and installation of Transitional Government of National Unity
Date,1 November 1965 – November 1979
Location,Chad
Result,Overthrow and death of François Tombalbaye in 1975Overthrow of Félix Malloum in 1979Signing of Lagos Accord and installation of Transitional Government of National Unity
Belligerents,Belligerents
"FROLINAT (from 1966)First Liberation Army (until 1975)Second Liberation Army (1968–76)Third Liberation Army (from 1968)Various splinter factionsFLT (until 1975) Volcan Army (from 1970) FAP (from 1976) FAN (1976–78, 1979) Tribal and peasant rebels Libya (1969–72, from 1975) Supported by:  Algeria  Kingdom of Libya (non-combat, until 1969)",ChadChadian Armed ForcesFROLINAT's First Liberation Army (c.1975)FAN (1978–79) France Supported by: Egypt  Israel
Commanders and leaders,Commanders and leaders
"Ibrahim Abatcha †(FROLINAT) Abba Siddick (FROLINAT) Hissène Habré (FROLINAT, Second Liberation Army, Third Liberation Army, FAN) Goukouni Oueddei (FROLINAT, Second Liberation Army, FAP) Ahmat Acyl (FROLINAT, First Liberation Army; Volcan Army) Mohamed Baghlani (Volcan Army) Muammar al-Gaddafi",François Tombalbaye † Félix Malloum Ahmat Acyl (First Liberation Army) Hissène Habré (FAN) Michel Arnaud Edouard Cortadellas
Strength,Strength

0,1
Date,1 November 1965 – November 1979
Location,Chad
Result,Overthrow and death of François Tombalbaye in 1975Overthrow of Félix Malloum in 1979Signing of Lagos Accord and installation of Transitional Government of National Unity

0,1,2,3,4
Richards in 2005,Richards in 2005,,,
Personal information,Personal information,,,
Full name,Isaac Vivian Alexander Richards,,,
Height,5 ft 10 in (1.78 m),,,
Batting,Right-handed,,,
Bowling,Right-arm slow seam Right-arm off-break,,,
Role,Batsman,,,
International information,International information,,,
National side,West Indies (1974–1991),,,
Test debut (cap 151),22 November 1974 v India,,,

Competition,Test,ODI,FC,LA
Matches,121,187,507,500
Runs scored,8540,6721,36212,16995
Batting average,50.23,47.00,49.40,41.96
100s/50s,24/45,11/45,114/162,26/109
Top score,291,189*,322,189*
Balls bowled,5170,5644,23226,12214
Wickets,32,118,223,290
Bowling average,61.37,35.83,45.15,30.59
5 wickets in innings,0,2,1,3
10 wickets in match,0,0,0,0

United Sabah PartyParti Bersatu Sabah,United Sabah PartyParti Bersatu Sabah.1
,
Malay name,Parti Bersatu Sabah ڤرتي برساتو سابه
Chinese name,沙巴團結黨 沙巴团结党 Shābā tuánjiédǎng
Abbreviation,PBS
President,Maximus Ongkili
Chairperson,Claudius Alex Sundang
Secretary-General,Joniston Bangkuai
Founder,Joseph Pairin Kitingan
Founded,5 March 1985; 37 years ago
Split from,Sabah People's United Front (BERJAYA)

Women's 70 kg at the 2021 European Judo Championships,Women's 70 kg at the 2021 European Judo Championships.1,Unnamed: 2
Venue,Altice Arena,
Location,"Lisbon, Portugal",
Date,17 April,
Competitors,18 from 16 nations,
Medalists,Medalists,
Sanne van Dijke (2nd title) Netherlands Margaux Pinot France Madina Taimazova Russia Bárbara Timo Portugal,Sanne van Dijke (2nd title) Netherlands Margaux Pinot France Madina Taimazova Russia Bárbara Timo Portugal,
,Sanne van Dijke (2nd title),Netherlands
,Margaux Pinot,France
,Madina Taimazova,Russia
,Bárbara Timo,Portugal

0,1,2
,Sanne van Dijke (2nd title),Netherlands
,Margaux Pinot,France
,Madina Taimazova,Russia
,Bárbara Timo,Portugal

Cholera,Cholera.1
Other names,"Asiatic cholera, epidemic cholera"
,
"A person with severe dehydration due to cholera, causing sunken eyes and wrinkled hands and skin.","A person with severe dehydration due to cholera, causing sunken eyes and wrinkled hands and skin."
Specialty,Infectious disease
Symptoms,"Large amounts of watery diarrhea, vomiting, muscle cramps"
Complications,"Dehydration, electrolyte imbalance"
Usual onset,2 hours to 5 days after exposure
Duration,A few days
Causes,Vibrio choleraespread by fecal-oral route
Risk factors,"Poor sanitation, not enough clean drinking water, poverty"

Diwali,Diwali.1
"Rangoli decorations, made using coloured fine powder or sand, are popular during Diwali.","Rangoli decorations, made using coloured fine powder or sand, are popular during Diwali."
Also called,Deepavali
Observed by,"Hindus, Jains, Sikhs, some Buddhists (notably Newar Buddhists)"
Type,"Religious, cultural, seasonal"
Significance,See below
Celebrations,"Diya lighting,puja(worship and prayer),vrat(fasting),dāna(charity),melā(fairs/shows), home cleansing and decoration, fireworks, gifts, feast and sweets"
Begins,"āśvina māsa (amānta) / kārtika māsa (purnimānta), kṛṣṇa pakṣa, trayodaśī tithi"
Ends,"kārtika māsa, śukla pakṣa, dvitīyā tithi"
Date,"Ashvin, Krishna, Thrayodashi, Kartika, Shukla, Dwitiya"
2022 date,October21 (Dhanteras/Yama Deepam)22 (Naraka Chaturdashi/Kali Chaudas/Hanuman Puja/Chhoti Diwali)23 (Lakshmi Puja/Kali Puja/Sharda Puja/Kedar Gauri Vrat)24 (Govardhan Puja/Balipratipada/Gujarati New Year)25 (Bhai Dooj/Vishwakarma Puja)


In [36]:
# Spot-check one mispredicted Biden question (row label 279).
# The trailing .loc[[279]] raises a KeyError if that row does not survive both
# filters, so this cell also confirms that row 279 is a mismatch whose question
# mentions "Biden".
html_render_df(
    df_gpt4.loc[lambda frame: frame["predicted_answer_short"] != frame["actual_answer"]]
    .loc[lambda frame: frame["question"].str.contains("Biden")]
    .loc[[279]]
)

Unnamed: 0,table,predicted_answer,actual_answer,question,predicted_answer_short
279,"Citizen Revolution MovementMovimiento Revolución CiudadanaAbbreviationRCLeaderRafael CorreaPresidentMarcela AguiñagaGeneral SecretaryDavid VillamarFounderIván EspinelFounded2010(historical) August 2021(modern)Registered18 August 2016; 5 years agoSplit fromPAIS AllianceHeadquartersQuitoYouth wingFrente de Jóvenes de la RCMembership(2022)200,000IdeologyProgressivismAnti-neoliberalismSocialism of the 21st centuryBolivarianismCorreismLeft-wing nationalismLeft-wing populismMarket socialismAnti-imperialismPolitical positionLeft-wingNational affiliationUnion for HopeColors Cyan  White  RedSeats in the National Assembly47 / 137Provincial Prefects2 / 137Mayors0 / 221Websiterevolucionciudadana.com.ecPolitics of EcuadorPolitical partiesElections",Irrelevant Context && The context provided does not give any information about Joe Biden's spouse during his first election to the Senate.,Unmarried,Who was Joe Biden married to when he was first elected to the Senate?,Irrelevant Context
Citizen Revolution MovementMovimiento Revolución Ciudadana,Citizen Revolution MovementMovimiento Revolución Ciudadana,,,,
,,,,,
Abbreviation,RC,,,,
Leader,Rafael Correa,,,,
President,Marcela Aguiñaga,,,,
General Secretary,David Villamar,,,,
Founder,Iván Espinel,,,,
Founded,2010(historical) August 2021(modern),,,,
Registered,18 August 2016; 5 years ago,,,,

Citizen Revolution MovementMovimiento Revolución Ciudadana,Citizen Revolution MovementMovimiento Revolución Ciudadana.1
,
Abbreviation,RC
Leader,Rafael Correa
President,Marcela Aguiñaga
General Secretary,David Villamar
Founder,Iván Espinel
Founded,2010(historical) August 2021(modern)
Registered,18 August 2016; 5 years ago
Split from,PAIS Alliance
Headquarters,Quito


In [37]:
# Shape of the subset whose full GPT-4 answer contains the substring "relevant"
# (case-sensitive; matches e.g. "Irrelevant Context" and "Not relevant").
# NOTE(review): other refusal wordings that show up in this notebook
# ("Not applicable", "Not available", "Unrelated context") are not matched,
# so this is a lower bound on "context did not fit" answers.
df_gpt4.loc[df_gpt4["predicted_answer"].str.contains("relevant")].shape

(15, 5)

In [38]:
# Render a reproducible (fixed seed) sample of 10 rows where the short predicted
# answer differs from the gold answer. The comparison is strict equality, so
# near matches such as "25 years old" vs "25" also count as mismatches.
html_render_df(
    df_gpt4.loc[lambda frame: frame["predicted_answer_short"] != frame["actual_answer"]]
    .sample(n=10, random_state=94)[
        ["table", "question", "predicted_answer_short", "actual_answer"]
    ]
)

Unnamed: 0,table,question,predicted_answer_short,actual_answer
719,"Hurricane GastonCategory 1 hurricane (SSHWS/NWS)Hurricane Gaston shortly after moving ashore on August 29FormedAugust 27, 2004DissipatedSeptember 3, 2004(Extratropical after September 1)Highest winds1-minute sustained:75 mph (120 km/h) Lowest pressure985 mbar (hPa); 29.09 inHgFatalities8 direct, 1 indirectDamage$130 million (2004 USD)Areas affectedSouth Carolina, North Carolina, Virginia, Maryland, Delaware, MassachusettsPart of the2004 Atlantic hurricane season",When was Hurricane Gaston on the land?,"August 27 to September 3, 2004",after August 29
Category 1 hurricane (SSHWS/NWS),Category 1 hurricane (SSHWS/NWS),,,
Hurricane Gaston shortly after moving ashore on August 29,Hurricane Gaston shortly after moving ashore on August 29,,,
Formed,"August 27, 2004",,,
Dissipated,"September 3, 2004",,,
(Extratropical after September 1),(Extratropical after September 1),,,
,,,,
,,,,
Highest winds,1-minute sustained:75 mph (120 km/h),,,
Lowest pressure,985 mbar (hPa); 29.09 inHg,,,

0,1
Category 1 hurricane (SSHWS/NWS),Category 1 hurricane (SSHWS/NWS)
Hurricane Gaston shortly after moving ashore on August 29,Hurricane Gaston shortly after moving ashore on August 29
Formed,"August 27, 2004"
Dissipated,"September 3, 2004"
(Extratropical after September 1),(Extratropical after September 1)
,
,
Highest winds,1-minute sustained:75 mph (120 km/h)
Lowest pressure,985 mbar (hPa); 29.09 inHg
,

Federal Defence Forces of Germany,Federal Defence Forces of Germany.1
Bundeswehr,Bundeswehr
,
Motto,Wir. Dienen. Deutschland. (German for ''We. Serve. Germany.'')
Founded,12 November 1955
Current form,3 October 1990
Service branches,Army  Navy  Air Force  Joint Support Service  Joint Medical Service  Cyber and Information Domain Service
Headquarters,"Berlin, Bonn, and Potsdam"
Website,www.bundeswehr.de
Leadership,Leadership
Commander-in-Chief,Federal Minister of Defence (during peacetime)Chancellor of Germany (during war)

0,1
"HMSSomersetin Indian Ocean, 2011","HMSSomersetin Indian Ocean, 2011"
History,History
United Kingdom,United Kingdom
Name,HMSSomerset
Operator,Royal Navy
Ordered,January 1992
Builder,Yarrow Shipbuilders
Laid down,12 October 1992
Launched,25 June 1994
Sponsored by,Lady Layard

0,1
Button at the 2012 Bahrain Grand Prix,Button at the 2012 Bahrain Grand Prix
Born,"Jenson Alexander Lyons Button 19 January 1980(age 42) Frome, Somerset, England"
Formula One World Championship career,Formula One World Championship career
Nationality,British
Active years,2000–2017
Teams,"Williams, Benetton, Renault, BAR, Honda, Brawn, McLaren"
Engines,"BMW, Renault, Honda, Mercedes"
Car number,22
Entries,309 (306 starts)
Championships,1 (2009)

Personal information,Personal information.1,Unnamed: 2
Born,"November 1, 1971",
Medal recordMen’s Field HockeyRepresenting ArgentinaChampions Challenge2001 Kuala LumpurTeam2005 AlexandriaTeam2007 BoomTeamPan American Games1995 Mar del PlataTeam1999 WinnipegTeam2003 Santo DomingoTeam2007 Rio de JaneiroTeam,Medal recordMen’s Field HockeyRepresenting ArgentinaChampions Challenge2001 Kuala LumpurTeam2005 AlexandriaTeam2007 BoomTeamPan American Games1995 Mar del PlataTeam1999 WinnipegTeam2003 Santo DomingoTeam2007 Rio de JaneiroTeam,
,,
Men’s Field Hockey,Men’s Field Hockey,Men’s Field Hockey
Representing Argentina,Representing Argentina,Representing Argentina
Champions Challenge,Champions Challenge,Champions Challenge
,2001 Kuala Lumpur,Team
,2005 Alexandria,Team
,2007 Boom,Team
Pan American Games,Pan American Games,Pan American Games

0,1,2
,,
Men’s Field Hockey,Men’s Field Hockey,Men’s Field Hockey
Representing Argentina,Representing Argentina,Representing Argentina
Champions Challenge,Champions Challenge,Champions Challenge
,2001 Kuala Lumpur,Team
,2005 Alexandria,Team
,2007 Boom,Team
Pan American Games,Pan American Games,Pan American Games
,1995 Mar del Plata,Team
,1999 Winnipeg,Team

Israel Defense Forces,Israel Defense Forces.1
צבא ההגנה לישראל‎,צבא ההגנה לישראל‎
Emblem of the Israel Defense Forces,Emblem of the Israel Defense Forces
Flag of the Israel Defense Forces,Flag of the Israel Defense Forces
Founded,26 May 1948; 74 years ago
Service branches,Israeli Ground Forces Israeli Air Force Israeli Navy
Website,www.idf.il
Leadership,Leadership
Prime Minister,Yair Lapid
Defense Minister,Benny Gantz
Chief of the General Staff,Lieutenant General Aviv Kochavi

Atlantic Time Zone,Atlantic Time Zone.1
Time zone,Time zone
Atlantic Time Zone,Atlantic Time Zone
UTC offset,UTC offset
AST,UTC−04:00
ADT,UTC−03:00
Current time,Current time
"08:40, 28 June 2022 AST[refresh] 09:40, 28 June 2022 ADT[refresh]","08:40, 28 June 2022 AST[refresh] 09:40, 28 June 2022 ADT[refresh]"
Observance of DST,Observance of DST
DST is observed in parts of this time zone.,DST is observed in parts of this time zone.

Chiyonofuji Mitsugu,Chiyonofuji Mitsugu.1
千代の富士 貢,千代の富士 貢
Chiyonofuji in 2010,Chiyonofuji in 2010
Personal information,Personal information
Born,"Mitsugu Akimoto June 1, 1955 Fukushima, Hokkaido, Japan"
Died,"July 31, 2016(aged 61) Tokyo, Japan"
Height,183 cm (6 ft 0 in)
Weight,126 kg (278 lb; 19 st 12 lb)
Career,Career
Stable,Kokonoe
Record,1045-437-170

Purim,Purim.1
18th-century manuscript of the prayer of Al HaNissim on the miracles of Purim,18th-century manuscript of the prayer of Al HaNissim on the miracles of Purim
Type,Jewish
Significance,Celebration of Jewish deliverance as told in the Book of Esther (megillah)
Celebrations,"Listening to the Book of Esther in synagogue;sending food parcels and giving charity;dressing up in costume;eating a festive meal;parties and parades (Adloyada);drinking alcoholic beverages, especially wine"
Date,"14th day of Adar (in Jerusalem and all ancient walled cities, 15th of Adar)"
2021 date,"Sunset, 25 February – nightfall, 26 February"
2022 date,"Sunset, 16 March – nightfall, 17 March"
2023 date,"Sunset, 6 March – nightfall, 7 March"
2024 date,"Sunset, 23 March – nightfall, 24 March"
Frequency,Annual

Kaiō Hiroyuki,Kaiō Hiroyuki.1
魁皇 博之,魁皇 博之
Kaiō in May 2008,Kaiō in May 2008
Personal information,Personal information
Born,"Hiroyuki Koga 24 July 1972(age 49) Nōgata, Fukuoka, Japan"
Height,1.85 m (6 ft 1 in)
Weight,170 kg (375 lb; 26 st 11 lb)
Web presence,website
Career,Career
Stable,Tomozuna
Record,1047–700–158


In [39]:
# How often does the same question text occur? First count rows per question,
# then count how many questions share each multiplicity.
(
    df_gpt4.groupby("question")
    .size()
    .rename("occurences_of_same_question")
    .to_frame()
    .groupby("occurences_of_same_question")
    .size()
)

occurences_of_same_question
1    975
2      3
4      2
5      4
6      3
dtype: int64

In [40]:
# Shape of the subset of rows whose question text appears more than once
# (keep=False flags every member of a duplicate group, not just the repeats).
df_gpt4.loc[df_gpt4.duplicated(subset="question", keep=False)].shape

(52, 5)

In [41]:
# Shape of the subset of rows whose (question, actual_answer) pair appears more
# than once.
df_gpt4.loc[
    df_gpt4.duplicated(subset=["question", "actual_answer"], keep=False)
].shape

(49, 5)

In [42]:
# Repeated questions whose (question, actual_answer) combination is unique,
# i.e. the same question text paired with a different gold answer.
(
    # Step 1: keep only rows whose question text occurs more than once.
    df_gpt4.loc[lambda frame: frame.duplicated(subset="question", keep=False)]
    # Step 2: drop every row whose question/answer pair is itself repeated.
    .drop_duplicates(subset=["question", "actual_answer"], keep=False)
    .sort_values(by="question")
)

Unnamed: 0,table,predicted_answer,actual_answer,question,predicted_answer_short
468,"<html><body><table class=""infobox"" style=""widt...",26 years && HMS Somerset was commissioned in 1...,28 Years,How many years does HMSAstute is service in UK...,26 years
893,"<table class=""infobox"" style=""width:25.5em;bor...",8 years && HMS Astute has been in service sinc...,8 Years (from 2014),How many years does HMSAstute is service in UK...,8 years
938,"<table class=""infobox"" style=""width:25.5em;bor...",Not applicable && The context given is about t...,A. J. Caleb Boggs,Who was the US senator from Delaware in Dec 1972?,Not applicable


In [43]:
# Rows that share both question and context table with at least one other row;
# comparing their predicted answers shows how stable the model output is for
# identical inputs.
df_gpt4.loc[df_gpt4.duplicated(subset=["question", "table"], keep=False)]

Unnamed: 0,table,predicted_answer,actual_answer,question,predicted_answer_short
18,"<html><body><table class=""infobox ib-time-zone...",2 hours && Florida is in Eastern Time Zone and...,two hours,What's the difference in time between Florida ...,2 hours
20,"<html><body><table class=""infobox ib-time-zone...",2 hours difference && Florida is in Eastern Ti...,two hours,What's the difference in time between Florida ...,2 hours difference
219,"<html><body><table class=""infobox vcard""><tbod...",25 years old && Futabayama Sadaji was born in ...,25,How old was Futabayama Sadaji when he achieved...,25 years old
221,"<html><body><table class=""infobox vcard""><tbod...",25 years old && Futabayama was born in 1912 an...,25,How old was Futabayama Sadaji when he achieved...,25 years old


In [44]:
# Rows where the same question received the same predicted answer more than
# once, listed by question (the context tables may still differ).
df_gpt4.loc[
    df_gpt4.duplicated(subset=["question", "predicted_answer"], keep=False)
].sort_values(by="question")

Unnamed: 0,table,predicted_answer,actual_answer,question,predicted_answer_short
342,"<html><body><table class=""infobox vevent""><tbo...",Neilia Hunter && Joe Biden was married to Neil...,Unmarried,Who was Joe Biden married to when he was first...,Neilia Hunter
728,"<table class=""infobox vevent"" style=""border-co...",Neilia Hunter && Joe Biden was married to Neil...,Unmarried,Who was Joe Biden married to when he was first...,Neilia Hunter
345,"<html><body><table class=""infobox vevent""><tbo...",Not relevant && The context provided does not ...,Neilia Hunter,Who was the better half of Joe Biden in 1970?,Not relevant
948,"<table class=""infobox"" style=""width:25.5em;bor...",Not relevant && The context provided does not ...,Neilia Hunter,Who was the better half of Joe Biden in 1970?,Not relevant


In [45]:
# Sanity check: do rows that share question and predicted answer (e.g. 342/728
# and 345/948) really have different context tables? If any such rows also
# shared the same table they would be listed here; an empty result means the
# tables differ.
df_gpt4.loc[
    df_gpt4.duplicated(subset=["question", "predicted_answer", "table"], keep=False)
]

Unnamed: 0,table,predicted_answer,actual_answer,question,predicted_answer_short


In [46]:
# Peek at rows with a repeated (question, actual_answer) pair; such repeats can
# differ in the predicted answer or in the context table.
(
    df_gpt4.loc[
        lambda frame: frame.duplicated(subset=["question", "actual_answer"], keep=False)
    ]
    .sort_values(by="question")
    .head()
)

Unnamed: 0,table,predicted_answer,actual_answer,question,predicted_answer_short
908,"<table class=""infobox"" style=""width:25.5em;bor...",Not available && The context provided is about...,27,At what age does Joe Biden join the democratic...,Not available
725,"<table class=""infobox vevent"" style=""border-co...",Information not available && The context provi...,27,At what age does Joe Biden join the democratic...,Information not available
922,"<table class=""infobox"" style=""width:25.5em;bor...",Not available && The context provided does not...,27,At what age does Joe Biden join the democratic...,Not available
845,"<table class=""infobox vevent""><tbody><tr><th c...",Unrelated context && The provided context does...,27,At what age does Joe Biden join the democratic...,Unrelated context
339,"<html><body><table class=""infobox vevent""><tbo...",Not applicable && The context provided is not ...,one,How many parties does Joe’s Biden’s is associa...,Not applicable


In [49]:
# Build a lookup from table id to raw HTML out of the per-table "<id>.html"
# files, then expose it as a two-column DataFrame (table_id, table).
html_table_dir = "../../data/maindata/tables/html/"
# Keep only "*.html" entries so stray files or folders in the directory (e.g.
# .DS_Store, .ipynb_checkpoints) cannot break the int() conversion below, and
# sort because os.listdir returns entries in arbitrary order.
html_tables = sorted(
    name for name in os.listdir(html_table_dir) if name.endswith(".html")
)
table_id_to_html = {}
for file in html_tables:
    # The infoboxes contain non-ASCII text (Japanese, Hebrew, Arabic, ...), so
    # read with an explicit encoding instead of the platform default.
    # NOTE(review): assumes the files are stored as UTF-8 - confirm.
    with open(os.path.join(html_table_dir, file), encoding="utf-8") as f:
        html = f.read()
    # File names are expected to be "<integer id>.html".
    table_id = int(file.replace(".html", ""))
    table_id_to_html[table_id] = html
# One row per table: dict keys become the "table_id" column, HTML the "table" column.
table_id_mapping = pd.DataFrame.from_dict(
    table_id_to_html, orient="index", columns=["table"]
).reset_index(names="table_id")