Skip to content

Commit

Permalink
t-movies/: Make 'em correct, jsons
Browse files Browse the repository at this point in the history
  • Loading branch information
pasky committed Jul 7, 2015
1 parent ff78ce5 commit b314123
Show file tree
Hide file tree
Showing 5 changed files with 16 additions and 5 deletions.
7 changes: 5 additions & 2 deletions t-movies/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -7,10 +7,13 @@ knowledge base in a narrow domain. Here, we choose the "movies" domain,
meant to be answerable using IMDB based data.

for s in devtest val trainmodel test; do
{ echo '[';
cat main/$s.json |
egrep 'qText.*(play|star[^t]|voice|movie|\bact)' |
egrep -v 'play[^ ]* (for|4)\b|position|playoff|soccer|music|sport|ball|guitar|tennis' >\
t-movies/$s.json
egrep -v 'play[^ ]* (for|4)\b|position|playoff|soccer|music|sport|ball|guitar|tennis'
echo ']'
# JSON forbids a trailing comma before the closing ']': reverse the lines with
# tac so the last record becomes line 2, strip its trailing comma, reverse back
} | tac | sed -e '2s/,$//' | tac > t-movies/$s.json
done

The dataset is currently rather noisy and mixed with sports questions.
Expand Down
2 changes: 2 additions & 0 deletions t-movies/devtest.json
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
[
{"qId": "wqr000120", "answers": ["Mila Kunis"], "qText": "who plays meg in family guy?"},
{"qId": "wqr000140", "answers": ["University of Phoenix Stadium"], "qText": "what stadium did the chicago cardinals play in?"},
{"qId": "wqr000580", "answers": ["New Moon", "He's a Bully, Charlie Brown", "Eclipse", "Cheaper by the Dozen 2", "Incarceron", "The Adventures of Sharkboy and Lavagirl", "Dear Eleanor", "Abduction", "Shadow Fury", "Field of Dreams 2: Lockout"], "qText": "what movies has taylor lautner?"},
Expand All @@ -17,3 +18,4 @@
{"qId": "wqr003400", "answers": ["Seth MacFarlane"], "qText": "who plays stewie griffin on family guy?"},
{"qId": "wqr003500", "answers": ["Matthew Broderick"], "qText": "who was the voice of simba?"},
{"qId": "wqr003760", "answers": ["In the Land of Blood and Honey"], "qText": "what movie is angelina jolie directing?"}
]
4 changes: 3 additions & 1 deletion t-movies/test.json
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
[
{"qId": "wqs000003", "answers": ["Tony Warren"], "qText": "who plays ken barlow in coronation street?"},
{"qId": "wqs000017", "answers": ["Norman Bird", "Martin Freeman", "Ian Holm"], "qText": "who plays bilbo baggins in the hobbit?"},
{"qId": "wqs000051", "answers": ["Karen Mulder"], "qText": "who will play mr gray in the film?"},
Expand Down Expand Up @@ -165,4 +166,5 @@
{"qId": "wqs001996", "answers": ["Nancy Cartwright"], "qText": "who played maggie in himym?"},
{"qId": "wqs002000", "answers": ["for amos"], "qText": "who played berger in sex and the city?"},
{"qId": "wqs002003", "answers": ["Eclipse", "Dark Kingdom: The Dragon King", "New Moon", "Remember Me", "How to Be", "Harry Potter and the Order of the Phoenix", "Little Ashes", "Bel Ami", "Twilight", "The Twilight Saga: Breaking Dawn - Part 1"], "qText": "what movies have robert pattinson in them?"},
{"qId": "wqs002005", "answers": ["Ken Jenkins"], "qText": "who plays bob kelso in scrubs?"},
{"qId": "wqs002005", "answers": ["Ken Jenkins"], "qText": "who plays bob kelso in scrubs?"}
]
4 changes: 3 additions & 1 deletion t-movies/trainmodel.json
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
[
{"qId": "wqr000001", "answers": ["Padm\u00e9 Amidala"], "qText": "what character did natalie portman play in star wars?"},
{"qId": "wqr000005", "answers": ["Denethor II"], "qText": "what character did john noble play in lord of the rings?"},
{"qId": "wqr000025", "answers": ["Abduction", "Eclipse", "Valentine's Day", "The Twilight Saga: Breaking Dawn - Part 1", "New Moon"], "qText": "what movies does taylor lautner play in?"},
Expand Down Expand Up @@ -256,4 +257,5 @@
{"qId": "wqr003702", "answers": ["Britt McKillip", "Kristen Wiig"], "qText": "who voices lola bunny in looney tunes?"},
{"qId": "wqr003706", "answers": ["David Wenham"], "qText": "who plays faramir in lord of the rings?"},
{"qId": "wqr003738", "answers": ["American Crude", "Air Buddies", "A Crush on You", "Brother Bear", "Back in Business", "A Night at the Roxbury", "Breakfast of Champions", "Bulworth", "Armageddon", "Brother Bear 2"], "qText": "what films did michael clarke duncan star in?"},
{"qId": "wqr003767", "answers": ["New Moon", "Eclipse", "The Runaways", "Into the Wild", "Adventureland", "Twilight"], "qText": "what movies did kristen stewart act in?"},
{"qId": "wqr003767", "answers": ["New Moon", "Eclipse", "The Runaways", "Into the Wild", "Adventureland", "Twilight"], "qText": "what movies did kristen stewart act in?"}
]
4 changes: 3 additions & 1 deletion t-movies/val.json
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
[
{"qId": "wqr000049", "answers": ["Cirque du Freak: The Vampire's Assistant", "The Hunger Games", "7 Days in Havana", "Journey to the Center of the Earth", "The Forger", "Detention", "Journey 2: The Mysterious Island", "Red Dawn", "The Third Rule", "The Kids Are All Right"], "qText": "what movie is josh hutcherson in?"},
{"qId": "wqr000069", "answers": ["Blossom", "Melissa & Joey", "Bow", "Gimme a Break!", "Run of the House", "Brotherly Love"], "qText": "what tv show did joey lawrence play on?"},
{"qId": "wqr000099", "answers": ["Woman at Wedding"], "qText": "who does the author stephenie meyer play in the movie twilight?"},
Expand Down Expand Up @@ -64,4 +65,5 @@
{"qId": "wqr003569", "answers": ["Jason Segel"], "qText": "who plays marvin eriksen?"},
{"qId": "wqr003599", "answers": ["The Legend of Zelda", "3D Dot Game Heroes", "Akuma-kun: Makai no Wana", "Atsui 12 Game: Furi Furi Party!", "11eyes CrossOver", "11eyes: Tsumi to Batsu to Aganai no Sh\u014djo", "Military Madness", "The Legend of Zelda: Twilight Princess", "Cosmic Walker"], "qText": "what games do japanese people play?"},
{"qId": "wqr003699", "answers": ["Marc Blucas"], "qText": "who plays riley finn on buffy the vampire slayer?"},
{"qId": "wqr003704", "answers": ["Matt Lanter"], "qText": "who voices anakin in the clone wars?"},
{"qId": "wqr003704", "answers": ["Matt Lanter"], "qText": "who voices anakin in the clone wars?"}
]

0 comments on commit b314123

Please sign in to comment.