In [3]:
import numpy as np
import json
from nltk.tokenize import word_tokenize
from nltk.tokenize import sent_tokenize

from sklearn.feature_extraction.text import TfidfVectorizer

<b>Word embedding</b>

In [4]:
embedding_size = 50
gloveFilePath = "data/glove.6B.50d.txt"
def loadGlove(filePath):
    file = open(filePath, 'r')
    
    vocab = {}
    embedding = []
    for i, line in enumerate(file.readlines()):
        line = line.strip().split(' ')
        word = line[0]
        vocab[word] = i
        embedding.append(line[1:])
    file.close()
    return vocab,embedding
vocab, embedding = loadGlove(gloveFilePath)
vocab_size = len(vocab)
print(vocab_size)

400000


<b>Load data</b>

In [5]:
f = open("./data/training.json", encoding='utf-8')
js = json.load(f)
#discard the token '?' at the end of each query
train_qs = [item['question'][:-1] for item in js]
tokenized_train_qs_all = [word_tokenize(item['question'][:-1]) for item in js]
train_texts = [item['text'] for item in js]
tokenized_train_texts_all = [word_tokenize(item['text']) for item in js]
train_aps = [item['answer_paragraph'] for item in js]
train_docids = [item['docid'] for item in js]
f.close()
print(train_qs[0])
print(tokenized_train_qs_all[0])
print(train_texts[0])
print(tokenized_train_texts_all[0])

A kilogram could be definined as having a Planck constant of what value
['A', 'kilogram', 'could', 'be', 'definined', 'as', 'having', 'a', 'Planck', 'constant', 'of', 'what', 'value']
6966662606895999999♠6.62606896×10−34 j⋅s
['6966662606895999999♠6.62606896×10−34', 'j⋅s']


In [6]:
f = open("./data/testing.json", encoding='utf-8')
js = json.load(f)
#discard the token '?' at the end of each query
test_qs = [item['question'][:-1] for item in js]
tokenized_test_qs_all = [word_tokenize(item['question'][:-1]) for item in js]
test_docids = [item['docid'] for item in js]
f.close()
print(test_qs[0])
print(tokenized_test_qs_all[0])

Modern browser support standards-based and defacto what
['Modern', 'browser', 'support', 'standards-based', 'and', 'defacto', 'what']


In [7]:
f = open("./data/documents.json", encoding='utf-8')
js = json.load(f)
docs = [ [ sent for para in item['text'] for sent in sent_tokenize(para)] for item in js]
tokenized_docs = [[word_tokenize(sent) for sent in doc] for doc in docs]
docids = [item['docid'] for item in js]
f.close()
print(docs[0])
print(tokenized_docs[0])

['First recognized in 1900 by Max Planck, it was originally the proportionality constant between the minimal increment of energy, E, of a hypothetical electrically charged oscillator in a cavity that contained black body radiation, and the frequency, f, of its associated electromagnetic wave.', 'In 1905 the value E, the minimal energy increment of a hypothetical oscillator, was theoretically associated by Einstein with a "quantum" or minimal element of the energy of the electromagnetic wave itself.', 'The light quantum behaved in some respects as an electrically neutral particle, as opposed to an electromagnetic wave.', 'It was eventually called the photon.', 'Classical statistical mechanics requires the existence of h (but does not define its value).', "Eventually, following upon Planck's discovery, it was recognized that physical action cannot take on an arbitrary value.", 'Instead, it must be some multiple of a very small quantity, the "quantum of action", now called the Planck cons

<b>Locate answer sentence with TF-IDF</b>

In [8]:
TfidfVectorizers = []
tfidf_paras_mats = []
for paras in docs:
    tfidf = TfidfVectorizer(tokenizer=word_tokenize, lowercase=True)
    tfidf_paras_mats.append(tfidf.fit_transform(paras))
    TfidfVectorizers.append(tfidf)

train_context_sents = []
train_queries = []
train_answers = []
for i,query in enumerate(train_qs):
    docid = train_docids[i]
    tfidf_query = TfidfVectorizers[docid].transform([query])
    relativities = np.dot(tfidf_query, tfidf_paras_mats[docid].T).toarray()
    indices = (-relativities).argsort()[0]
    
    answer = train_texts[i]
    tokenized_answer = word_tokenize(answer)
    for index in indices:
        tokenized_context = tokenized_docs[docid][index]
        #if answer is not in context, which means we failed to find the right context. We discard this train item
        if tokenized_answer[0] in tokenized_context and tokenized_answer[-1] in tokenized_context:
            train_context_sents.append(docs[docid][index])
            train_queries.append(query)
            train_answers.append(answer)
            break
print(train_context_sents[6])
print(train_queries[6])
print(train_answers[6])
            
test_context_sents = []
for i,query in enumerate(test_qs):
    docid = test_docids[i]
    tfidf_query = TfidfVectorizers[docid].transform([query])
    relativities = np.dot(tfidf_query, tfidf_paras_mats[docid].T)
    index = np.argmax(relativities)
    test_context_sents.append(docs[docid][index])
print(test_context_sents[0])

First recognized in 1900 by Max Planck, it was originally the proportionality constant between the minimal increment of energy, E, of a hypothetical electrically charged oscillator in a cavity that contained black body radiation, and the frequency, f, of its associated electromagnetic wave.
What is frequency also known as in science
f
Modern web browsers support a combination of standards-based and de facto HTML and XHTML, which should be rendered in the same way by all browsers.


<b>Get answer indices in context</b>

In [9]:
tokenized_train_context = [word_tokenize(context) for context in train_context_sents]
tokenized_train_qs = [word_tokenize(query) for query in train_queries]
tokenized_train_answers = [word_tokenize(answer) for answer in train_answers]

In [104]:
#indices of answer words in context 
train_answers_indices = []
for i,answer in enumerate(tokenized_train_answers):
    start_w = answer[0]
    start_i = -1
    end_w = answer[-1]
    end_i = -1
    
    has_answer = False
    for j,word in enumerate(tokenized_train_context[i]):
        if start_w == word:
            start_i = j
        if end_w == word:
            end_i = j
        
        answer_indices = []
        #answer should be less than 5 words, and start index should smaller than end_i
        if start_i!=-1 and end_i - start_i <= 5 and end_i >= start_i :
            for index in range(start_i, end_i+1):
                answer_indices.append(index)
            train_answers_indices.append(answer_indices)
            has_answer = True
            break
    if not has_answer:
        train_answers_indices.append([])
        
print(tokenized_train_context[0])
print(tokenized_train_answers[0])
print(train_answers_indices[0])
    
tokenized_test_context = [word_tokenize(context) for context in test_context_sents]
tokenized_test_qs = [word_tokenize(query) for query in test_qs]

['The', 'most', 'urgent', 'unit', 'on', 'the', 'list', 'for', 'redefinition', 'is', 'the', 'kilogram', ',', 'whose', 'value', 'has', 'been', 'fixed', 'for', 'all', 'science', '(', 'since', '1889', ')', 'by', 'the', 'mass', 'of', 'a', 'small', 'cylinder', 'of', 'platinum–iridium', 'alloy', 'kept', 'in', 'a', 'vault', 'just', 'outside', 'Paris', '.']
['cylinder']
[31]


In [11]:
embed_train_context = [[embedding[vocab[word]] for word in context if word in vocab] for context in tokenized_train_context]
embed_train_qs = [[embedding[vocab[word]] for word in q if word in vocab] for q in tokenized_train_qs]
embed_train_answers = [[embedding[vocab[word]] for word in answer if word in vocab] for answer in tokenized_train_answers]
embed_test_context = [[embedding[vocab[word]] for word in context if word in vocab] for context in tokenized_test_context]
embed_test_qs = [[embedding[vocab[word]] for word in q if word in vocab] for q in tokenized_test_qs]
print(embed_train_answers[0])

[['0.53501', '0.51619', '1.2869', '-0.44228', '-0.6153', '1.5837', '0.77163', '-0.74072', '-0.59075', '0.44771', '0.35128', '0.16073', '-0.43567', '1.5196', '-0.32378', '0.0080341', '-0.37728', '1.537', '-0.44858', '-2.0515', '0.050697', '-1.3163', '-0.074289', '-0.13453', '0.1929', '-0.46173', '0.51555', '1.3476', '-0.38719', '0.38547', '1.7052', '-0.84175', '0.16006', '1.0468', '1.2382', '0.33616', '0.95423', '0.14869', '0.48572', '0.44431', '0.54502', '-0.20186', '-0.43291', '0.1342', '-0.58757', '0.40151', '0.93869', '0.16292', '-0.1962', '-0.99166']]


<b>Deep learning model</b>

In [12]:
max_context_size = 0
for tokenized_doc in tokenized_docs:
    for tokenized_sent in tokenized_doc:
        len_sent = len(tokenized_sent)
        if max_context_size < len_sent:
            max_context_size = len_sent

max_query_size = 0
for query in tokenized_train_qs_all:
    len_query = len(query)
    if max_query_size < len_query:
        max_query_size = len_query
for query in tokenized_test_qs_all:
    len_query = len(query)
    if max_query_size < len_query:
        max_query_size = len_query
        
max_answer_size = 0
for answer in tokenized_train_answers:
    len_answer = len(answer)
    if max_answer_size < len_answer:
        max_answer_size = len_answer

print(max_context_size)
print(max_query_size)
print(max_answer_size)

382
59
8



training data

In [43]:
trainig_size = len(embed_train_qs)

training_contexts = np.zeros(
    (trainig_size, max_context_size, embedding_size),
    dtype='float32')
training_queries = np.zeros(
    (trainig_size, max_query_size, embedding_size),
    dtype='float32')
#answers are indices in context
# training_answers = np.zeros(
#     (trainig_size, max_answer_size, max_context_size),
#     dtype='float32')

#answers are start and end indices in context
training_answers = np.zeros(
    ( 2, trainig_size, max_context_size),
    dtype='float32')

#similarity matrix of context words to context words
training_cc = np.zeros(
    (trainig_size, max_context_size, max_context_size),
    dtype='float32')
#similarity matrix of query words to query words
training_qq = np.zeros(
    (trainig_size, max_query_size, max_query_size),
    dtype='float32')
#similarity matrix of context words to query words
training_qc = np.zeros(
    (trainig_size, max_query_size, max_context_size),
    dtype='float32')
training_input = np.zeros(
    (trainig_size, max_query_size, max_context_size),
    dtype='float32')

for i, embed_context in enumerate(embed_train_context):
    for j, embed_word in enumerate(embed_context):
        training_contexts[i,j] = embed_word
        
for i, embed_query in enumerate(embed_train_qs):
    for j, embed_word in enumerate(embed_query):
        training_queries[i,j] = embed_word

for i, answer_indices in enumerate(train_answers_indices):
    if len(answer_indices) > 1:
        training_answers[0, i, answer_indices[0]] = 1.
        training_answers[1, i, answer_indices[-1]] = 1.
        
for i in range(trainig_size):
    training_cc[i] = np.dot(training_contexts[i], training_contexts[i].T)
    training_qq[i] = np.dot(training_queries[i], training_queries[i].T)
    training_qc[i] = np.dot(training_queries[i], training_contexts[i].T)
    training_input[i] = np.dot( np.dot(training_qq[i], training_qc[i]), training_cc[i])

testing data

In [99]:
testing_size = len(embed_test_qs)

testing_contexts = np.zeros(
    (testing_size, max_context_size, embedding_size),
    dtype='float32')
testing_size_queries = np.zeros(
    (testing_size, max_query_size, embedding_size),
    dtype='float32')

#similarity matrix of context words to context words
testing_cc = np.zeros(
    (testing_size, max_context_size, max_context_size),
    dtype='float32')
#similarity matrix of query words to query words
testing_qq = np.zeros(
    (testing_size, max_query_size, max_query_size),
    dtype='float32')
#similarity matrix of context words to query words
testing_qc = np.zeros(
    (testing_size, max_query_size, max_context_size),
    dtype='float32')
testing_input = np.zeros(
    (testing_size, max_query_size, max_context_size),
    dtype='float32')

for i, embed_context in enumerate(embed_test_context):
    for j, embed_word in enumerate(embed_context):
        testing_contexts[i,j] = embed_word
        
for i, embed_query in enumerate(embed_test_qs):
    for j, embed_word in enumerate(embed_query):
        testing_queries[i,j] = embed_word
        
for i in range(testing_size):
    testing_cc[i] = np.dot(testing_contexts[i], testing_contexts[i].T)
    testing_qq[i] = np.dot(testing_queries[i], testing_queries[i].T)
    testing_qc[i] = np.dot(testing_queries[i], testing_contexts[i].T)
    testing_input[i] = np.dot( np.dot(testing_qq[i], testing_qc[i]), testing_cc[i])

NameError: name 'testing_queries' is not defined

'''
testing_size = len(embed_test_qs)

input_contexts = np.zeros(
    (testing_size, max_context_size, embedding_size),
    dtype='float32')

input_queries = np.zeros(
    (testing_size, max_query_size, embedding_size),
    dtype='float32')
'''

In [109]:
import keras.backend as K
from keras.models import Model
from keras import layers
from keras.layers import Input, GRU, Dense, Reshape, Flatten

batch_size = 128  
epochs = 100
qc_relations_size = max_context_size*max_query_size

<b>model 1 pure GRU</b>

In [44]:
qc_relations = Input(shape=(None, max_context_size))
qc_relations_dense = Dense(max_query_size, activation='relu')(qc_relations)
encoder_outputs = GRU(output_dim = max_context_size, activation = 'tanh')(qc_relations_dense) #output_dim #activation

start = Dense(max_context_size, activation='softmax')(encoder_outputs)
end = Dense(max_context_size, activation='softmax')(encoder_outputs)

  This is separate from the ipykernel package so we can avoid doing imports until


In [None]:
model = Model(qc_relations, [start, end])
model.compile(optimizer='adam', loss='categorical_crossentropy') 
model.fit(training_input, [training_answers[0], training_answers[1]] ,
          batch_size=batch_size,
          epochs=epochs,
          validation_split=0.2)

In [47]:
my_answers = []
for i,embed_query in enumerate(embed_train_qs):
    start_idx, end_idx = model.predict(training_input[i:i+1])
    start_idx = np.argmax(start_idx)
    end_idx = np.argmax(end_idx)
    print(train_answers_indices[i], "\t", start_idx, end_idx)
    print("Answer:", train_answers[i], "My answer:", tokenized_train_context[i][start_idx:end_idx+1])

[31] 	 5 8
Answer: cylinder My answer: ['the', 'list', 'for', 'redefinition']
[3, 4, 5] 	 5 8
Answer: time vs. energy My answer: ['energy', '.']
[15, 16, 17] 	 5 8
Answer: quantum of action My answer: ['some', 'multiple', 'of', 'a']
[11] 	 5 8
Answer: 1913 My answer: ['quantized', 'model', 'of', 'the']
[7] 	 5 8
Answer: h My answer: ['existence', 'of', 'h', '(']
[7] 	 5 8
Answer: h My answer: ['existence', 'of', 'h', '(']
[42] 	 5 8
Answer: f My answer: ['Max', 'Planck', ',', 'it']
[9] 	 5 8
Answer: 1839 My answer: ['Alexandre', 'Edmond', 'Becquerel', 'in']
[19] 	 5 8
Answer: 1911 My answer: ['as', 'the', '``', 'ultraviolet']
[78, 79] 	 5 8
Answer: multiphoton effect My answer: ['each', 'photoelectron', ')', 'is']
[5, 6] 	 5 8
Answer: nuclear magneton My answer: ['nuclear', 'magneton', 'are', 'units']
[9, 10] 	 5 8
Answer: 555 nanometres My answer: ['with', 'a', 'wavelength', 'of']
[6] 	 5 8
Answer: 1911 My answer: ['in', '1911', 'was', 'devoted']
[22, 23] 	 5 8
Answer: hot atoms My an

[13] 	 5 8
Answer: four My answer: ['his', 'work', ',', 'Universal']
[23] 	 5 8
Answer: seven-year My answer: ['was', 'impressed', 'by', 'the']
[18] 	 5 8
Answer: 1989 My answer: ['serious', 'dramatic', 'films', ',']
[20] 	 5 8
Answer: cinematography My answer: ['in', 'Scouting', ',', 'Spielberg']
[13] 	 5 8
Answer: four My answer: ['his', 'work', ',', 'Universal']
[7] 	 5 8
Answer: poorly My answer: ['film', 'fared', 'poorly', 'at']
[23] 	 5 8
Answer: 1996 My answer: ['publishers', 'Knowledge', 'Adventure', 'on']
[24] 	 5 8
Answer: 1980 My answer: ['Encounters', 'project', 'and', ',']
[13] 	 5 8
Answer: six My answer: ['reviews', 'from', 'critics', ',']
[18] 	 5 8
Answer: 1982 My answer: ['the', 'novel', 'of', 'the']
[15, 16, 17] 	 5 8
Answer: reportedly close friends My answer: [',', "''", 'starred', 'Joan']
[50] 	 5 8
Answer: terrorism My answer: ['films', 'began', 'addressing', 'humanistic']
[10] 	 5 8
Answer: 1981 My answer: ['at', 'the', 'box', 'office']
[18] 	 5 8
Answer: editin

[4, 5] 	 5 8
Answer: guided missile My answer: ['missile', 'resulted', 'in', 'a']
[31, 32] 	 5 8
Answer: guided missiles My answer: ['defence', 'was', 'one', 'of']
[4, 5] 	 5 8
Answer: important buildings My answer: ['buildings', 'were', 'common', 'in']
[14] 	 5 8
Answer: 1950s My answer: ['mm', 'guns', 'would', 'continue']
[23, 24] 	 5 8
Answer: the u.s. army My answer: ['some', '(', 'largely', 'communist']
[6, 7] 	 5 8
Answer: maximum ceiling My answer: [',', 'maximum', 'ceiling', 'being']
[9] 	 5 8
Answer: .50-inch My answer: ['considering', 'anything', 'larger', 'than']
[25, 26, 27, 28, 29] 	 5 8
Answer: `` flaktürme '' flak towers My answer: ['concrete', 'blockhouses', ',', 'some']
[9, 10] 	 5 8
Answer: homeland air defence My answer: ['defence', 'may', 'be', 'for']
[1] 	 5 8
Answer: 1925 My answer: ['a', 'new', 'instrument', 'developed']
[8, 9] 	 5 8
Answer: the laser My answer: ['anti-aircraft', 'use', 'is', 'the']
[38] 	 5 8
Answer: 1990 My answer: ['for', 'instance', ',', 'air

[13, 14, 15] 	 5 8
Answer: indvuna ye nkhundla My answer: ['is', 'elected', 'at', 'the']
[19] 	 5 8
Answer: 1906 My answer: ['(', 'for', 'example', ',']
[14, 15, 16] 	 5 8
Answer: at least ten My answer: ['it', ',', 'he', 'or']
[] 	 5 8
Answer: constituency executive committee My answer: ['committee', '(', 'bucopho', ')']
[11, 12] 	 5 8
Answer: 30 seats My answer: ['Libandla', 'consists', 'of', 'the']
[3, 4] 	 5 8
Answer: 21.6 % My answer: ['of', 'preschool', 'age', 'children']
[27] 	 5 8
Answer: 1982 My answer: [',', 'the', 'constitution', 'of']
[1] 	 5 8
Answer: 1903 My answer: ['victory', 'in', 'the', 'Anglo-Boer']
[12, 13, 14] 	 5 8
Answer: 19 august 2005 My answer: ['chastity', 'rite', 'of', '``']
[33, 34, 35, 36] 	 5 8
Answer: less than 20 % My answer: ['the', 'external', 'debt', 'burden']
[0, 1] 	 5 8
Answer: 83 % My answer: ['population', 'adheres', 'to', 'Christianity']
[1, 2, 3, 4] 	 5 8
Answer: childless , unmarried girls My answer: ['can', 'take', 'part', '.']
[17, 18] 	 5 

[6] 	 5 8
Answer: 1952 My answer: ['in', '1952', ',', 'he']
[] 	 5 8
Answer: executive order 10925 My answer: [',', 'Kennedy', 'issued', 'Executive']
[12, 13, 14] 	 5 8
Answer: mediocrity and incompetence My answer: ['is', 'the', 'idea', 'that']
[7, 8] 	 5 8
Answer: positive action My answer: ['words', '``', 'positive', 'action']
[3] 	 5 8
Answer: 5-4 My answer: [',', 'the', 'Supreme', 'Court']
[46, 47] 	 5 8
Answer: the descendants My answer: ['in', 'the', 'South', 'Bronx']
[30, 31, 32] 	 5 8
Answer: remedying past discrimination My answer: ['who', 'wrote', 'From', 'Ending']
[8, 9] 	 5 8
Answer: compensation argument My answer: ['action', 'is', 'the', 'compensation']
[23] 	 5 8
Answer: 14 My answer: ['affirmative', 'action', 'itself', 'is']
[18, 19, 20] 	 5 8
Answer: 52 million acres My answer: ['belonging', 'to', 'Native', 'Americans']
[3] 	 5 8
Answer: 10,000 My answer: ['at', 'the', 'Lincoln', 'Memorial']
[23, 24, 25] 	 5 8
Answer: just outlawing discrimination My answer: ['similar

[14, 15] 	 5 8
Answer: intellectual development My answer: ['suffered', 'from', 'an', 'education']
[11, 12] 	 5 8
Answer: breaking up My answer: ['Prussian', 'southern', 'attacks', 'in']
[27, 28, 29] 	 5 8
Answer: inflamed public opinion My answer: ['the', 'public', ',', 'Bismarck']
[15, 16] 	 5 8
Answer: significant distances My answer: ['Moltke', "'s", 'ability', 'to']
[11, 12, 13] 	 5 8
Answer: their military system My answer: ['advantages', 'given', 'to', 'the']
[4] 	 5 8
Answer: 7,855 My answer: ['killed', 'and', 'wounded', 'along']
[7, 8] 	 5 8
Answer: war reparations My answer: ['amenable', 'to', 'war', 'reparations']
[11] 	 5 8
Answer: trench-warfare My answer: ['use', 'of', 'the', 'Chassepot']
[24, 25] 	 5 8
Answer: very limited My answer: ['Great', 'Britain', 'remained', 'the']
[7, 8, 9] 	 5 8
Answer: the chassepot rifle My answer: ['worth', 'against', 'the', 'Dreyse']
[10, 11, 12] 	 5 8
Answer: 1859 to 1873 My answer: ['Prussian', 'Minister', 'of', 'War']
[4] 	 5 8
Answer: 2

[8] 	 5 8
Answer: summer My answer: [',', 'produced', 'in', 'summer']
[9] 	 5 8
Answer: density My answer: ['the', 'variation', 'in', 'wood']
[14, 15, 16] 	 5 8
Answer: near the base My answer: ['upper', 'portion', 'of', 'the']
[8, 9] 	 5 8
Answer: ripple sycamore My answer: ['such', 'as', 'the', 'ripple']
[18] 	 5 8
Answer: birds My answer: ['in', 'hickory', 'and', 'certain']
[10, 11] 	 5 8
Answer: insect attacks My answer: ['hemlock', 'is', 'the', 'result']
[12] 	 5 8
Answer: veneers My answer: ['manufactured', 'by', 'bonding', 'together']
[6] 	 5 8
Answer: three My answer: ['has', 'three', 'main', 'components']
[7] 	 5 8
Answer: water-saturated My answer: ['green', '(', 'water-saturated', ')']
[15] 	 5 8
Answer: thin My answer: ['heartwood', 'very', 'early', 'in']
[25] 	 5 8
Answer: weapons My answer: ['millennia', 'for', 'many', 'purposes']
[23] 	 5 8
Answer: decay My answer: [',', 'or', 'deep', 'wound']
[24] 	 5 8
Answer: density My answer: ['growth', 'ring', 'is', 'usually']
[25]

[7] 	 5 8
Answer: cherry My answer: ['walnut', 'and', 'cherry', ',']
[1] 	 5 8
Answer: ring-porous My answer: ['of', 'the', 'early', 'wood']
[6] 	 5 8
Answer: radial My answer: [',', 'radial', 'growth', ',']
[21] 	 5 8
Answer: houses My answer: ['millennia', 'for', 'many', 'purposes']
[1, 2] 	 5 8
Answer: white pines My answer: ['not', 'much', 'contrast', 'between']
[12] 	 5 8
Answer: mechanically My answer: ['its', 'native', 'form', 'may']
[15] 	 5 8
Answer: cellulose My answer: ['paper', 'industry', 'is', 'the']
[14] 	 5 8
Answer: cellulose My answer: ['and', 'the', 'cell', 'walls']
[9] 	 5 8
Answer: sapwood My answer: ['is', 'first', 'formed', 'as']
[19] 	 5 8
Answer: timber My answer: ['to', 'felled', 'trees', ',']
[22] 	 5 8
Answer: glue My answer: ['manufactured', 'by', 'bonding', 'together']
[1, 2] 	 5 8
Answer: 100 million My answer: ['of', 'wood', 'was', 'consumed']
[17] 	 5 8
Answer: diffuse-porous My answer: ['is', 'customary', 'to', 'divide']
[14] 	 5 8
Answer: slow My answ

[16, 17, 18] 	 5 8
Answer: 2014 and 2016 My answer: ['being', 'inducted', 'into', 'the']
[6, 7] 	 5 8
Answer: number one My answer: ['reached', 'number', 'one', 'in']
[15, 16, 17, 18] 	 5 8
Answer: `` madonna mic '' My answer: [',', 'the', 'microphone', 'design']
[6, 7] 	 5 8
Answer: breast cancer My answer: ['of', 'breast', 'cancer', ',']
[21, 22, 23] 	 5 8
Answer: $ 305.2 million My answer: ['Tour', 'in', 'May', '2006']
[4] 	 5 8
Answer: 38 My answer: ['top-ten', 'singles', 'on', 'the']
[3] 	 5 8
Answer: academics My answer: ['her', 'a', '``', 'dynamic']
[14] 	 5 8
Answer: 1977 My answer: ['Michigan', ',', 'Madonna', 'moved']
[13, 14, 15] 	 5 8
Answer: 15 million copies My answer: ['number', 'one', 'on', 'the']
[3, 4] 	 5 8
Answer: urban direction My answer: ['with', 'Hard', 'Candy', '(']
[18, 19, 20, 21] 	 5 8
Answer: simple love songs , My answer: ['the', 'content', 'of', 'the']
[] 	 5 8
Answer: the english roses , My answer: ['venture', 'was', 'Madonna', "'s"]
[12] 	 5 8
Answer: t

[1] 	 5 8
Answer: 75 My answer: ['Jewish', 'population', 'in', 'France']
[20] 	 5 8
Answer: 16 My answer: ['workplace', 'of', '144,600', 'employees']
[23, 24] 	 5 8
Answer: the city My answer: ['sixty', 'homeless', 'shelters', ',']
[1] 	 5 8
Answer: bistro My answer: ['of', 'eating', 'place', 'loosely']
[2] 	 5 8
Answer: 20th My answer: ['the', 'Paris', 'literary', 'community']
[18] 	 5 8
Answer: bridges My answer: ['to', 'prevent', 'sacking', 'by']
[15, 16, 17] 	 5 8
Answer: 1786 and 1814 My answer: ['from', 'Cimetière', 'des', 'Innocents']
[1, 2, 3] 	 5 8
Answer: 2 february 2000 My answer: ['Philippe', 'Binant', 'realised', 'the']
[12] 	 5 8
Answer: 1682 My answer: ['and', 'moved', 'his', 'court']
[21] 	 5 8
Answer: 144,600 My answer: ['Hauts-de-Seine', 'department', 'La', 'Défense']
[58] 	 5 8
Answer: 1,176 My answer: ['and', 'contracts', 'it', 'out']
[18] 	 5 8
Answer: thirteen My answer: ['two', 'French', 'Muslim', 'extremists']
[18] 	 5 8
Answer: 1977 My answer: ['architecture', 

[24] 	 5 8
Answer: 303,465 My answer: ['for', 'this', 'transmitter', 'to']
[21] 	 5 8
Answer: cambium My answer: ['the', 'xylem', 'and', 'phloem']
[16, 17] 	 5 8
Answer: flowering plants My answer: ['has', 'been', 'Angiospermae', '(']
[4] 	 5 8
Answer: magnoliids My answer: ['the', 'first', 'to', 'diverge']
[5] 	 5 8
Answer: biochemical My answer: ['biochemical', '(', 'physiological', ')']
[26, 27, 28] 	 5 8
Answer: increase in thickness My answer: ['layer', 'of', 'cambium', 'between']
[16] 	 5 8
Answer: flowering My answer: ['remain', 'too', 'fragile', 'to']
[10, 11, 12] 	 5 8
Answer: green and leaf-like My answer: ['of', 'sepals', ')', 'is']
[7] 	 5 8
Answer: flower My answer: ['is', 'the', 'flower', '.']
[39, 40] 	 5 8
Answer: annual rings My answer: ['character', 'of', 'the', 'elements']
[26, 27, 28] 	 5 8
Answer: inferior transitional forms My answer: ['be', 'a', 'common', 'source']
[2, 3, 4] 	 5 8
Answer: whole genome duplication My answer: ['event', 'at', '160', 'million']
[10] 

[22] 	 5 8
Answer: 2013 My answer: ['of', 'Architecture', 'and', 'Urban']
[7, 8] 	 5 8
Answer: three divisions My answer: ['University', 'comprises', 'three', 'divisions']
[2] 	 5 8
Answer: 1853 My answer: ['named', 'after', 'George', 'Washington']
[3] 	 5 8
Answer: four My answer: ['student-run', 'media', 'outlets', '.']
[14, 15, 16, 17] 	 5 8
Answer: 12 research centers . My answer: ['the', 'university-wide', 'Institute', 'of']
[1, 2] 	 5 8
Answer: the 1890s My answer: ['to', 'the', 'dramatic', 'expansion']
[9, 10, 11] 	 5 8
Answer: full-time or part-time My answer: ['pursue', 'an', 'MBA', 'either']
[1] 	 5 8
Answer: 1957 My answer: ['for', 'the', 'construction', 'of']
[7] 	 5 8
Answer: 1988 My answer: ['beginning', 'in', '1988', 'by']
[26] 	 5 8
Answer: sanctions My answer: ['Amadou', 'Sanogo', 'seized', 'power']
[12] 	 5 8
Answer: 113 My answer: ['the', 'Alliance', 'for', 'Democracy']
[14] 	 5 8
Answer: nonviolent My answer: ['300', 'lives', 'over', 'the']
[13] 	 5 8
Answer: five-y

[] 	 5 8
Answer: scarlet biretta My answer: ['is', 'distinctive', 'not', 'merely']
[] 	 5 8
Answer: cardinal priests My answer: ['numerous', 'of', 'the', 'three']
[7] 	 5 8
Answer: white My answer: ['is', 'always', 'white', '—']
[21] 	 5 8
Answer: 1962 My answer: ['that', 'all', 'cardinals', ',']
[27, 28] 	 5 8
Answer: 10 years My answer: ['the', 'right', 'to', '``']
[11] 	 5 8
Answer: 1917 My answer: ['Code', 'of', 'Canon', 'Law']
[13] 	 5 8
Answer: 1567 My answer: ['was', 'reserved', 'for', 'the']
[15] 	 5 8
Answer: third My answer: ['were', 'Italian', 'by', '1994']
[14, 15, 16] 	 5 8
Answer: the cardinalate expires My answer: ['revealing', 'the', 'identity', 'of']
[26] 	 5 8
Answer: prince My answer: ['sanctae', 'romanae', 'ecclesiae', 'cardinalis']
[22] 	 5 8
Answer: seven My answer: ['of', 'electing', 'the', 'pope']
[15] 	 5 8
Answer: marry My answer: ['inaccurately', 'called', '``', 'lay']
[3] 	 5 8
Answer: 1563 My answer: ['influential', 'Ecumenical', 'Council', 'of']
[20] 	 5 8

[22, 23, 24] 	 5 8
Answer: nerve fiber tracts My answer: ['the', 'brain', 'is', 'taken']
[9, 10, 11] 	 5 8
Answer: slow wave sleep My answer: ['and', 'serotonin', 'drop', 'during']
[3] 	 5 8
Answer: invertebrates My answer: ['as', 'sponges', ',', 'jellyfish']
[6] 	 5 8
Answer: strokes My answer: ['of', 'strokes', 'and', 'other']
[9, 10, 11] 	 5 8
Answer: twice as large My answer: ['has', 'a', 'brain', 'roughly']
[5, 6] 	 5 8
Answer: the 1990s My answer: ['the', '1990s', 'were', 'officially']
[10] 	 5 8
Answer: white My answer: ['on', 'the', 'outside', 'and']
[35] 	 5 8
Answer: mesencephalon My answer: ['the', 'brain', 'appears', 'as']
[1, 2, 3] 	 5 8
Answer: autonomic nervous system My answer: ['heart', 'rate', ',', 'digestion']
[9] 	 5 8
Answer: 30 My answer: ['primates', 'includes', 'at', 'least']
[5] 	 5 8
Answer: mammals My answer: ['mammals', 'are', 'generally', 'similar']
[7, 8, 9] 	 5 8
Answer: the pituitary gland My answer: ['go', 'to', 'the', 'pituitary']
[5, 6, 7] 	 5 8
Answe

[37, 38, 39] 	 5 8
Answer: the modern age My answer: ['that', ',', 'while', 'Sanskrit']
[11, 12] 	 5 8
Answer: composition contests My answer: ["''", '(', 'since', '2002']
[6] 	 5 8
Answer: gurukulas My answer: ['traditional', 'gurukulas', 'throughout', 'India']
[7] 	 5 8
Answer: close My answer: ['includes', 'the', 'close', 'relationship']
[9, 10] 	 5 8
Answer: oral tradition My answer: ['society', ',', 'and', 'the']
[71] 	 5 8
Answer: inferior My answer: ['logically', 'opposite', 'sources', 'for']
[13, 14] 	 5 8
Answer: separate dialects My answer: ['and', 'Classical', 'or', '``']
[1] 	 5 8
Answer: 1974 My answer: ['been', 'a', 'short', 'daily']
[3, 4] 	 5 8
Answer: daily newspaper My answer: ['in', 'Sanskrit', ',', 'has']
[52, 53] 	 5 8
Answer: lingua franca My answer: [':', 'saṃskṛtam', '[', 'səmskr̩t̪əm']
[12] 	 5 8
Answer: bhāṣā My answer: ['many', 'Southeast', 'Asian', 'languages']
[4, 5] 	 5 8
Answer: 18th century My answer: ['century', 'like', 'Sir', 'William']
[18, 19] 	 5 8


[14, 15, 16] 	 5 8
Answer: the scanning system My answer: ['remaining', 'numeric', 'parameter', 'is']
[6] 	 5 8
Answer: 10 My answer: ['contains', '10', 'HD', 'channels']
[22] 	 5 8
Answer: region by region My answer: ['contains', '10', 'HD', 'channels']
[8, 9, 10] 	 5 8
Answer: the frame rate My answer: ['a', 'product', ',', 'the']
[9] 	 5 8
Answer: 16:9 My answer: ['HDTV', 'also', 'handle', 'the']
[63, 64] 	 5 8
Answer: 20 million My answer: [',', 'the', 'number', 'of']
[2, 3, 4] 	 5 8
Answer: a research project My answer: ['and', 'the', 'system', 'was']
[21] 	 5 8
Answer: 625 My answer: ['until', 'the', '1960s', ',']
[] 	 5 8
Answer: analog tape My answer: ['capable', 'of', 'recording', 'analog']
[22, 23] 	 5 8
Answer: by satellite My answer: ['analog', 'HDTV', 'to', 'about']
[28, 29] 	 5 8
Answer: monochrome only My answer: ['even', 'higher-resolution', 'standard', 'at']
[6] 	 5 8
Answer: twice My answer: ['has', 'twice', 'the', 'linear']
[16, 17] 	 5 8
Answer: 1953 , My answer: ['

[41, 42] 	 5 8
Answer: 25 percent My answer: ['for', 'installed', 'wind', 'energy']
[14] 	 5 8
Answer: 2007 My answer: ['named', 'the', 'top', 'event']
[5] 	 5 8
Answer: 77 My answer: ['77', 'counties', 'that', 'govern']
[17] 	 5 8
Answer: 1976 My answer: ['the', 'Medieval', 'Fair', 'of']
[11] 	 5 8
Answer: 10-day My answer: ['over', 'one', 'million', 'people']
[29] 	 5 8
Answer: fifth My answer: ['third-largest', 'producer', 'of', 'natural']
[7] 	 5 8
Answer: two My answer: ['state', "'s", 'two', 'members']
[17] 	 5 8
Answer: 638,817 My answer: ['up', 'of', 'public', 'school']
[1] 	 5 8
Answer: 1927 My answer: ['Cyrus', 'Avery', ',', 'known']
[12, 13] 	 5 8
Answer: glass sculptures My answer: ['Art', 'contains', 'the', 'most']
[92] 	 5 8
Answer: 45,688 My answer: [',', 'Oklahoma', "'s", 'largest']
[6] 	 5 8
Answer: 11,330 My answer: ['by', '11,330', 'people', ',']
[39, 40, 41] 	 5 8
Answer: tell the world My answer: ['2010-', ')', ',', 'sociologist']
[38, 39, 40] 	 5 8
Answer: $ 12 mi

[20, 21] 	 5 8
Answer: nonimaging optics My answer: ['the', 'light', 'emission', 'of']
[28, 29, 30] 	 5 8
Answer: gamut area index My answer: ['to', 'meet', 'the', 'expectations']
[6, 7, 8] 	 5 8
Answer: searchlights and flares My answer: ['present', 'searchlights', 'and', 'flares']
[14, 15] 	 5 8
Answer: stage lighting My answer: ['use', 'many', 'of', 'the']
[15, 16] 	 5 8
Answer: translucent tube My answer: ['low', 'wattage', ',', 'low']
[16, 17] 	 5 8
Answer: small lights My answer: ['steps', 'in', 'the', 'aisles']
[16] 	 5 8
Answer: positive My answer: ['performance', ',', 'improve', 'the']
[31, 32, 33] 	 5 8
Answer: lumen per watt My answer: ['fixtures', 'is', 'the', 'luminous']
[9] 	 5 8
Answer: 50,000 My answer: ['longer', '—', 'up', 'to']
[1, 2] 	 5 8
Answer: incandescent bulb My answer: ['color', 'temperature', 'around', '2800']
[10, 11] 	 5 8
Answer: incandescent light My answer: ['price', 'came', 'about', 'with']
[3, 4] 	 5 8
Answer: lighting cues My answer: ['are', 'prepare

[8] 	 5 8
Answer: manjaniq My answer: ['ballista', ')', ',', 'manjaniq']
[6] 	 5 8
Answer: 749 My answer: ['in', '749', ',', 'the']
[13] 	 5 8
Answer: 5.79 My answer: ['the', 'Umayyad', 'Caliphate', 'covered']
[7] 	 5 8
Answer: northern My answer: ['Resafa', 'in', 'northern', 'Syria']
[13] 	 5 8
Answer: cohort My answer: ['abandoned', 'the', 'old', 'division']
[16] 	 5 8
Answer: 684 My answer: ['at', 'a', 'battle', 'at']
[21] 	 5 8
Answer: dhimmis My answer: ['Caliphate', ',', 'which', 'included']
[14, 15] 	 5 8
Answer: after 1587 My answer: ['Christiana', 'en', 'letra', 'y']
[50] 	 5 8
Answer: ethnic My answer: ['not', 'only', 'from', 'Mainlander']
[12] 	 5 8
Answer: tha̍k-im My answer: ['colloquial', 'readings', '(', '文白異讀']
[5] 	 5 8
Answer: 1842 My answer: ['1842', ',', 'Xiamen', '(']
[12, 13, 14] 	 5 8
Answer: the 16th century My answer: ['Hokkien', ',', 'can', 'be']
[1] 	 5 8
Answer: 1993 My answer: ['the', 'first', 'region', 'in']
[6, 7, 8] 	 5 8
Answer: 5 to 7 My answer: ['have

[8, 9] 	 5 8
Answer: very strong My answer: ['``', 'There', 'are', 'very']
[61, 62] 	 5 8
Answer: over 150 My answer: ['Wen', 'Jiabao', 'ordered', 'the']
[17] 	 5 8
Answer: 700 My answer: ['Wenchuan', 'and', 'four', 'nearby']
[2, 3] 	 5 8
Answer: donated blood My answer: ['resulting', 'in', 'according', 'to']
[11] 	 5 8
Answer: 31 My answer: ['later', 'said', 'that', 'a']
[16] 	 5 8
Answer: months My answer: ['by', 'the', 'government', 'piece']
[7, 8] 	 5 8
Answer: satellite images My answer: ['of', 'its', 'satellite', 'images']
[6, 7] 	 5 8
Answer: international help My answer: ['accept', 'international', 'help', 'to']
[30] 	 5 8
Answer: 420,000 My answer: ['aftershocks', ',', 'one', '5.2']
[7] 	 5 8
Answer: five My answer: ['mother', 'of', 'five', 'at']
[13, 14, 15] 	 5 8
Answer: neglected and untouched My answer: ['earthquake', 'hit', 'an', 'area']
[4] 	 5 8
Answer: seven My answer: ['schools', 'collapsed', ',', 'burying']
[4, 5] 	 5 8
Answer: 4.8 million My answer: ['million', 'peo

[0] 	 5 8
Answer: 1,300 My answer: [',', 'with', 'initial', 'relocation']
[15, 16] 	 5 8
Answer: around 280 My answer: ['to', 'contact', 'the', 'Wolong']
[14, 15] 	 5 8
Answer: health care My answer: ['Qiang', 'told', 'reporters', 'in']
[15, 16, 17] 	 5 8
Answer: put them online My answer: ['Shifang', ',', 'taken', 'photos']
[5, 6] 	 5 8
Answer: safety checks My answer: ['safety', 'checks', 'were', 'to']
[16] 	 5 8
Answer: booths My answer: ['were', 'made', 'by', 'people']
[22, 23] 	 5 8
Answer: 19 km My answer: ['(', '50', 'mi', ')']
[7, 8] 	 5 8
Answer: government officials My answer: ['that', '``', 'government', 'officials']
[7, 8, 9] 	 5 8
Answer: the government My answer: ['earthquake', ',', 'the', 'Chinese']
[10, 11] 	 5 8
Answer: around 3,000 My answer: ['Town', ',', 'Wenchuan', ',']
[4] 	 5 8
Answer: 200,000 My answer: ['people', 'were', 'evacuated', 'from']
[12] 	 5 8
Answer: calm My answer: ['Hotel', 'in', 'Chengdu', 'said']
[36, 37, 38] 	 5 8
Answer: 1976 tangshan earthquake

[20] 	 5 8
Answer: 24 My answer: [',', 'there', 'are', '77']
[6, 7, 8] 	 5 8
Answer: the m6 motorway My answer: ['on', 'the', 'M6', 'motorway']
[22] 	 5 8
Answer: 1972 My answer: ['College', 'of', 'Music', '(']
[8] 	 5 8
Answer: 77 My answer: [',', 'there', 'are', '77']
[23] 	 5 8
Answer: sheep My answer: ['this', 'area', 'is', 'devoted']
[9] 	 5 8
Answer: 1974 My answer: ['significant', 'boundary', 'reform', 'in']
[21] 	 5 8
Answer: 1994 My answer: ['was', 'transferred', 'from', 'the']
[43] 	 5 8
Answer: 1905 My answer: ['of', 'Barrow-in-Furness', ',', 'Blackburn']
[12, 13, 14] 	 5 8
Answer: the southern part My answer: ['the', 'county', 'became', 'increasingly']
[9] 	 5 8
Answer: 1893 My answer: ['Music', 'was', 'founded', 'in']
[1] 	 5 8
Answer: 1889 My answer: ['county', 'of', 'Lancashire', 'was']
[36] 	 5 8
Answer: 1993 My answer: ['focal', 'point', 'for', 'many']
[10, 11] 	 5 8
Answer: ceremonial county My answer: ['Lord-Lieutenant', '(', 'termed', 'now']
[14, 15, 16] 	 5 8
Answe

[17] 	 5 8
Answer: martial My answer: [',', 'Chopin', "'s", 'works']
[63] 	 5 8
Answer: 1830 My answer: ['the', 'death', 'of', 'Chopin']
[9, 10] 	 5 8
Answer: rigid procedures My answer: ['performance', ',', 'Chopin', 'avoided']
[25] 	 5 8
Answer: 1849 My answer: [';', 'French', 'pronunciation', ':']
[4] 	 5 8
Answer: 1831 My answer: [',', 'Chopin', 'received', 'the']
[19] 	 5 8
Answer: pianos My answer: ['23', 'March', '1833', ',']
[21] 	 5 8
Answer: 1810 My answer: [';', 'French', 'pronunciation', ':']
[12, 13, 14] 	 5 8
Answer: best possible condition My answer: ['little', 'piano', ',', 'which']
[4, 5, 6] 	 5 8
Answer: flute and violin My answer: ['and', 'violin', ';', 'the']
[16] 	 5 8
Answer: 1927 My answer: ['music', 'competition', ',', 'the']
[61, 62, 63] 	 5 8
Answer: intimate keyboard technique My answer: ['in', 'the', 'Revue', 'et']
[10] 	 5 8
Answer: apartment My answer: ['Paris', ',', 'where', 'Chopin']
[7] 	 5 8
Answer: piano My answer: ['include', 'the', 'piano', '.']
[16

[5] 	 5 8
Answer: 48,000 My answer: ['48,000', 'inmates', 'was', 'established']
[21] 	 5 8
Answer: 1618 My answer: ['the', 'grandmaster', 'of', 'the']
[4] 	 5 8
Answer: 800,000 My answer: ['Germans', 'were', 'living', 'in']
[7] 	 5 8
Answer: 1466 My answer: ['Thorn', 'in', '1466', 'it']
[2] 	 5 8
Answer: 1,500 My answer: ['ordered', 'to', 'be', 'renamed']
[12] 	 5 8
Answer: 42,094 My answer: ['October', '1948', '21', 'transports']
[8] 	 5 8
Answer: publishers My answer: ['number', 'of', 'peak', 'publishers']
[24] 	 5 8
Answer: absolutism My answer: ['chief', 'characteristics', 'as', 'historicism']
[15] 	 5 8
Answer: 1909 My answer: ['Society', "'s", 'headquarters', 'to']
[13] 	 5 8
Answer: low My answer: ['on', 'Religion', '&', 'Public']
[7, 8, 9] 	 5 8
Answer: their door-to-door preaching My answer: ['known', 'for', 'their', 'door-to-door']
[15] 	 5 8
Answer: voting My answer: ['do', 'not', 'seek', 'public']
[21, 22] 	 5 8
Answer: house-to-house preaching My answer: ['at', 'Cedar', 'P

Answer: 45,000 My answer: ['books', 'is', 'derived', 'from']
[3] 	 5 8
Answer: tourism My answer: ['Nepal', 'has', 'thrived', ';']
[7] 	 5 8
Answer: icons My answer: ['form', 'of', 'icons', 'of']
[15] 	 5 8
Answer: inscriptions My answer: ['history', ',', 'spanning', 'nearly']
[8] 	 5 8
Answer: 74 My answer: ['30', 'hectares', '(', '74']
[17] 	 5 8
Answer: 300 My answer: ['the', 'Spiritual', 'Assembly', 'of']
[17] 	 5 8
Answer: 21 My answer: [',', 'garments', ',', 'carpets']
[3] 	 5 8
Answer: one My answer: ['restaurant', 'in', '1955', '.']
[13] 	 5 8
Answer: lake My answer: ['present-day', 'Kathmandu', 'was', 'once']
[15, 16, 17] 	 5 8
Answer: humid subtropical climate My answer: [',', 'portions', 'of', 'the']
[12] 	 5 8
Answer: tri-city My answer: ['as', '``', 'KTM', "''"]
[13] 	 5 8
Answer: 170 My answer: ['is', 'said', 'that', 'in']
[6, 7] 	 5 8
Answer: 5th century My answer: ['famous', '5th', 'century', 'Hindu']
[6] 	 5 8
Answer: two My answer: ['into', 'two', 'areas', ':']
[6] 	 

[35] 	 5 8
Answer: 1985 My answer: ['regulations', 'among', 'countries', ',']
[1] 	 5 8
Answer: label My answer: ['proper', 'use', 'of', 'the']
[4, 5, 6] 	 5 8
Answer: dissolve in fats My answer: ['in', 'fats', 'and', 'are']
[2] 	 5 8
Answer: 1960s My answer: ['than', '1', 'kg/ha', '(']
[45, 46] 	 5 8
Answer: 10 % to 212 % My answer: ['in', 'northern', 'Florida', 'found']
[5, 6, 7] 	 5 8
Answer: every 15 years My answer: ['every', '15', 'years', 'to']
[5] 	 5 8
Answer: 1960s My answer: ['1960s', ',', 'led', 'by']
[21, 22] 	 5 8
Answer: the wind My answer: ['atmosphere', 'at', 'relatively', 'high']
[12] 	 5 8
Answer: 1910 My answer: ['authority', 'for', 'regulating', 'pesticides']
[23, 24, 25] 	 5 8
Answer: weakness or paralysis My answer: ['enzyme', 'acetylcholinesterase', ',', 'allowing']
[7] 	 5 8
Answer: 2002 My answer: ['1998', 'and', '2002', '.']
[40] 	 5 8
Answer: cancer My answer: ['variety', 'of', 'adverse', 'health']
[25, 26] 	 5 8
Answer: chemical structure My answer: ['targe

[3] 	 5 8
Answer: 1883 My answer: ['she', 'fell', 'down', 'some']
[20, 21, 22] 	 5 8
Answer: her popularity recovered My answer: ['seclusion', ',', 'republicanism', 'temporarily']
[4, 5] 	 5 8
Answer: typhoid fever My answer: ['fever', 'by', 'William', 'Jenner']
[1] 	 5 8
Answer: 1839 My answer: ['after', 'Radicals', 'and', 'Tories']
[14] 	 5 8
Answer: 1900 My answer: ['throughout', 'her', 'widowhood', ',']
[] 	 5 8
Answer: the kensington system My answer: ['from', 'meeting', 'people', 'whom']
[31, 32] 	 5 8
Answer: older fathers My answer: ['the', 'mutation', 'arose', 'spontaneously']
[11, 12] 	 5 8
Answer: constitutional monarchy My answer: ['the', 'gradual', 'establishment', 'of']
[12] 	 5 8
Answer: 82 My answer: ['the', '1892', 'general', 'election']
[21, 22] 	 5 8
Answer: chloroform . My answer: ['birth', 'to', 'her', 'eighth']
[3] 	 5 8
Answer: 1865 My answer: ['and', 'after', 'a', 'brief']
[] 	 5 8
Answer: family monarchy My answer: ['more', 'symbolic', 'than', 'political']
[1] 

[17] 	 5 8
Answer: male My answer: ['of', 'a', 'haemophiliac', 'in']
[9, 10] 	 5 8
Answer: his budget My answer: ['resigned', 'in', '1885', 'after']
[16, 17, 18] 	 5 8
Answer: with her mother My answer: ['unmarried', 'young', 'woman', 'Victoria']
[1, 2, 3] 	 5 8
Answer: 2 march 1882 My answer: ['Roderick', 'Maclean', ',', 'a']
[1] 	 5 8
Answer: disliked My answer: ['the', 'constant', 'round', 'of']
[25, 26, 27] 	 5 8
Answer: a eulogistic biography My answer: ['her', 'accident', ',', 'and']
[24, 25, 26, 27] 	 5 8
Answer: the boer war My answer: ['to', 'Ireland', 'for', 'the']
[1] 	 5 8
Answer: 1845 My answer: ['hit', 'by', 'a', 'potato']
[13, 14, 15] 	 5 8
Answer: 14 december 1861 My answer: ['fever', 'by', 'William', 'Jenner']
[17, 18] 	 5 8
Answer: her mother My answer: ['unmarried', 'young', 'woman', 'Victoria']
[8] 	 5 8
Answer: 1848 My answer: ['the', 'revolutions', 'of', '1848']
[6] 	 5 8
Answer: 1840 My answer: ['in', '1840', ',', 'in']
[8] 	 5 8
Answer: 1844 My answer: ['recipro

[3, 4] 	 5 8
Answer: carpet weaving My answer: ['was', 'particularly', 'significant', 'in']
[4] 	 5 8
Answer: 400,000 My answer: ['Muslims', 'fleeing', 'with', 'the']
[6, 7, 8] 	 5 8
Answer: the non-muslim population My answer: [',', 'the', 'non-Muslim', 'population']
[5] 	 5 8
Answer: 571 My answer: ['571', 'primary', 'and', '94']
[7, 8, 9] 	 5 8
Answer: units called usul My answer: ['around', 'rhythmic', 'units', 'called']
[7, 8] 	 5 8
Answer: the state My answer: ['in', 'which', 'the', 'state']
[19, 20, 21] 	 5 8
Answer: a muslim minority My answer: ['the', '15th', 'century', 'the']
[] 	 5 8
Answer: in 1915 My answer: ['Russian', 'Caucasus', 'Army', 'continued']
[7, 8, 9] 	 5 8
Answer: 30 october 1918 My answer: ['signed', 'on', '30', 'October']
[1, 2, 3] 	 5 8
Answer: 10 november 1444 My answer: ['Murad', 'II', 'defeated', 'the']
[23] 	 5 8
Answer: east My answer: ['on', 'many', 'fronts', 'during']
[11] 	 5 8
Answer: 1768–1774 My answer: ['Empire', 'into', 'the', 'Russo-Turkish']
[

[18] 	 5 8
Answer: hardware My answer: [',', 'several', 'websites', 'have']
[7] 	 5 8
Answer: apartments My answer: ['their', 'personal', 'apartments', ',']
[74] 	 5 8
Answer: weight My answer: ['Super', 'Slim', 'model', 'a']
[2] 	 5 8
Answer: four My answer: ['content', 'the', 'What', "'s"]
[27, 28] 	 5 8
Answer: $ 306 My answer: ['at', 'US', '$', '499']
[70] 	 5 8
Answer: disc-loader My answer: ['new', 'Super', 'Slim', '4']
[14] 	 5 8
Answer: quieter My answer: ['form', 'factor', ',', 'decreased']
[14] 	 5 8
Answer: news My answer: ['the', 'existing', '[', 'Information']
[1, 2, 3] 	 5 8
Answer: paid netflix subscription My answer: ['required', 'for', 'the', 'service']
[2] 	 5 8
Answer: 2009 My answer: ['Computer', 'Entertainment', 'and', 'Netflix']
[52, 53, 54] 	 5 8
Answer: to cut costs My answer: ['May', '2005', 'featured', 'two']
[13] 	 5 8
Answer: city My answer: ['globe', 'data', 'to', 'display']
[] 	 5 8
Answer: the playstation store My answer: ['available', 'via', 'the', 'PC']

[2] 	 5 8
Answer: 2013 My answer: ['Infectious', 'Disease', 'Society', 'of']
[4] 	 5 8
Answer: 2 My answer: ['new', 'antibiotics', 'were', 'approved']
[12, 13, 14] 	 5 8
Answer: overgrowth of yeast My answer: ['vaginal', 'flora', ',', 'and']
[9, 10] 	 5 8
Answer: antibiotic resistance My answer: ['problems', 'with', 'antimicrobial', 'and']
[9, 10] 	 5 8
Answer: prophylactic antibiotics My answer: ['include', 'excessive', 'use', 'of']
[3, 4] 	 5 8
Answer: 20th century My answer: [',', 'treatments', 'for', 'infections']
[13] 	 5 8
Answer: penicillins My answer: [',', 'the', 'beta-lactam', 'antibiotics']
[14] 	 5 8
Answer: 1942 My answer: ['purifying', 'the', 'first', 'penicillin']
[24] 	 5 8
Answer: tyrothricin My answer: ['the', 'start', 'of', 'World']
[5] 	 5 8
Answer: 20th My answer: ['20th', 'century', ',', 'and']
[33] 	 5 8
Answer: 1977 My answer: ['the', 'question', 'of', 'emergence']
[9, 10, 11] 	 5 8
Answer: increased body mass My answer: ['life', 'is', 'associated', 'with']
[11,

[32, 33, 34] 	 5 8
Answer: the national capital My answer: ['People', "'s", 'Republic', 'of']
[7, 8] 	 5 8
Answer: public transportation My answer: ['cities', ',', 'public', 'transportation']
[30, 31] 	 5 8
Answer: hill hiking My answer: ['were', 'observed', 'in', 'the']
[23, 24] 	 5 8
Answer: inland ports My answer: ['area', 'and', 'the', 'center']
[16, 17, 18] 	 5 8
Answer: the southern suburb My answer: ['There', 'is', 'a', 'long']
[5, 6, 7] 	 5 8
Answer: the olympic spirit My answer: ['the', 'Olympic', 'spirit', 'and']
[65, 66, 67] 	 5 8
Answer: 600 years ago My answer: ['human', 'cost', 'of', 'some']
[22, 23] 	 5 8
Answer: 121 stations My answer: ['a', 'metro', 'system', 'with']
[1, 2, 3] 	 5 8
Answer: 10 february 2010 My answer: ['the', '122nd', 'IOC', 'session']
[6, 7] 	 5 8
Answer: 190 mi My answer: ['(', '190', 'mi', ')']
[4, 5, 6] 	 5 8
Answer: “ world-class ” My answer: ['world-class', '”', 'industrial', 'city']
[16, 17] 	 5 8
Answer: 750 mi My answer: ['(', '190', 'mi', ')'

[9, 10] 	 5 8
Answer: indigenous civilizations My answer: ['was', 'home', 'to', 'numerous']
[5] 	 5 8
Answer: single My answer: ['single', 'stringed', 'instrument', '.']
[33, 34] 	 5 8
Answer: 150 years My answer: ['contacts', 'with', 'Europeans', 'and']
[0] 	 5 8
Answer: 2012 My answer: ['similarities', 'in', 'ages', 'and']
[21, 22] 	 5 8
Answer: many accomplishments My answer: ['and', 'European', 'accounts', 'and']
[13] 	 5 8
Answer: single My answer: ['the', 'first', 'inhabitants', 'of']
[29] 	 5 8
Answer: 200,000 My answer: ['built', 'one', 'of', 'the']
[24] 	 5 8
Answer: mestizo My answer: ['population', 'are', 'of', 'full-blooded']
[14, 15] 	 5 8
Answer: about 600,329 My answer: ['indigenous', 'population', '(', 'known']
[10] 	 5 8
Answer: none My answer: ['proposed', 'and', 'used', ',']
[29, 30, 31] 	 5 8
Answer: wild teosinte grasses My answer: ['indigenous', 'peoples', 'developed', 'entirely']
[24, 25] 	 5 8
Answer: 3.7 % My answer: ['%', 'majority', 'of', 'residents']
[23, 24

[9, 10] 	 5 8
Answer: a disturbance My answer: ['theorized', 'that', 'pain', 'was']
[14] 	 5 8
Answer: specificity My answer: ['with', 'Avicenna', "'s", ',']
[4] 	 5 8
Answer: 13 My answer: ['studies', 'found', 'evidence', 'for']
[10] 	 5 8
Answer: nociceptive My answer: ['pain', ':', '(', '1']
[18] 	 5 8
Answer: sugar My answer: ['effect', 'of', 'pain', 'on']
[18] 	 5 8
Answer: identical My answer: ['fiber', 'endings', '(', 'with']
[3] 	 5 8
Answer: distressing My answer: ['often', 'caused', 'by', 'intense']
[19] 	 5 8
Answer: unclear My answer: ['of', 'animals', ',', 'such']
[5] 	 5 8
Answer: plants My answer: ['plants', ',', 'or', 'other']
[6, 7] 	 5 8
Answer: cancer pain My answer: ['as', 'cancer', 'pain', 'or']
[4, 5, 6, 7] 	 5 8
Answer: complex , subjective phenomenon My answer: [',', 'subjective', 'phenomenon', ',']
[10] 	 5 8
Answer: nociceptive My answer: ['pain', ':', '(', '1']
[4, 5] 	 5 8
Answer: cancer patients My answer: ['patients', 'who', 'often', 'have']
[8] 	 5 8
Answ

[12] 	 5 8
Answer: eight My answer: ['most', 'rail-oriented', 'cities', 'in']
[1] 	 5 8
Answer: ecclesiastical My answer: ['the', 'Viking', 'longphort', ',']
[29] 	 5 8
Answer: four My answer: ['Ireland', "'s", 'most', 'successful']
[7] 	 5 8
Answer: rhoticity My answer: ['degrees', 'of', 'rhoticity', ',']
[10, 11, 12] 	 5 8
Answer: average of 97 My answer: ['foggy', 'city', ',', 'with']
[11, 12, 13] 	 5 8
Answer: late 19th century My answer: ['from', 'Lithuania', 'and', 'Russia']
[6] 	 5 8
Answer: pharmaceuticals My answer: ['is', 'pharmaceuticals', ',', 'with']
[8, 9, 10] 	 5 8
Answer: six electoral wards My answer: ['elected', 'members', 'representing', 'six']
[10] 	 5 8
Answer: 7 My answer: [',', 'and', 'Cork', 'has']
[27, 28] 	 5 8
Answer: 2 days My answer: ['of', '7', 'days', 'of']
[4, 5] 	 5 8
Answer: fully walled My answer: ['walled', ',', 'and', 'some']
[20] 	 5 8
Answer: rain My answer: ['of', '1,227.9', 'millimetres', '(']
[16] 	 5 8
Answer: mid-2000s My answer: ['the', 'mai

[5, 6] 	 5 8
Answer: 4 % My answer: ['4', '%', 'in', '2009']
[1] 	 5 8
Answer: 47-metre My answer: ['building', ',', 'which', 'includes']
[1, 2] 	 5 8
Answer: civil service My answer: ['supported', 'by', 'the', 'federal']
[2] 	 5 8
Answer: decade My answer: ['unemployment', 'rates', 'and', 'depopulation']
[12] 	 5 8
Answer: 1673 My answer: ['fend', 'off', 'a', 'second']
[30] 	 5 8
Answer: explorer My answer: ['handwritten', 'Latin', 'text', 'in']
[4] 	 5 8
Answer: 1,400,000 My answer: ['passengers', 'travelled', 'through', 'the']
[21, 22] 	 5 8
Answer: 15.1 mph My answer: ['St.', 'John', "'s", 'is']
[13, 14] 	 5 8
Answer: silver thaws My answer: ['is', 'subject', 'to', 'freezing']
[28, 29] 	 5 8
Answer: 15 metres My answer: ['more', 'office', 'space', 'downtown']
[3] 	 5 8
Answer: two My answer: ['schools', ',', 'St.', 'Bonaventure']
[3] 	 5 8
Answer: 2006 My answer: [',', 'there', 'were', '100,646']
[27] 	 5 8
Answer: 1675 My answer: ['the', '17th', 'century', 'and']
[1, 2] 	 5 8
Answ

[14, 15, 16] 	 5 8
Answer: six or eight My answer: ['four', 'records', ',', 'with']
[10, 11, 12, 13, 14] 	 5 8
Answer: `` cx '' noise reduction My answer: ['scheme', 'involved', 'using', 'the']
[3, 4, 5] 	 5 8
Answer: a shellac-based compound My answer: ['compound', 'was', 'introduced', 'and']
[11] 	 5 8
Answer: 1933 My answer: ['test', 'discs', 'using', 'the']
[12, 13] 	 5 8
Answer: compact discs My answer: ['individual', 'digital', 'tracks', ',']
[19, 20, 21] 	 5 8
Answer: microphones and amplifiers My answer: ['the', 'time', 'that', 'early']
[1] 	 5 8
Answer: 1931 My answer: ['launched', 'the', 'first', 'commercially']
[2] 	 5 8
Answer: 1910 My answer: ['note', '1', ']', 'bound']
[66, 67, 68] 	 5 8
Answer: automatic gain control My answer: ['standard', 'record', 'playback', 'preamplifiers']
[14, 15] 	 5 8
Answer: wide-pitched section My answer: ['the', 'end', 'of', 'the']
[10] 	 5 8
Answer: 46:1 My answer: ['rpm', ',', 'such', 'that']
[6, 7, 8] 	 5 8
Answer: stereophonic record syst

[] 	 5 8
Answer: the center My answer: ['microphone', 'was', 'of', 'paramount']
[] 	 5 8
Answer: digital compact disc My answer: ['digital', 'media', ',', 'in']
[2, 3, 4] 	 5 8
Answer: retrieve the information My answer: ['from', 'a', 'laterally', 'modulated']
[15] 	 5 8
Answer: rpm My answer: [',', 'some', 'children', "'s"]
[18] 	 5 8
Answer: 1925 My answer: ['new', 'electrical', 'system', 'from']
[11, 12, 13, 14, 15] 	 5 8
Answer: a `` purist '' transcription My answer: ['of', 'magnetic', 'tape', 'in']
[21, 22, 23] 	 5 8
Answer: high quality cuts My answer: ['the', 'invention', 'of', 'the']
[5] 	 5 8
Answer: mirror-like My answer: ['mirror-like', 'finish', ',', 'the']
[23, 24, 25] 	 5 8
Answer: lift the arm My answer: [',', 'most', 'automatic', 'turntables']
[10, 11] 	 5 8
Answer: subsonic filter My answer: ['stereo', 'receivers', 'contained', 'a']
[11, 12, 13] 	 5 8
Answer: later surround-sound systems My answer: ['but', 'were', 'an', 'important']
[] 	 5 8
Answer: master disc My ans

[48, 49, 50] 	 5 8
Answer: monasteries and universities My answer: [',', 'descended', 'into', 'turmoil']
[13, 14] 	 5 8
Answer: private television My answer: ['in', 'the', 'UK', ',']
[14] 	 5 8
Answer: northwest My answer: ['years', 'the', 'land', 'that']
[4, 5] 	 5 8
Answer: temperate marine My answer: ['marine', 'climate', '.']
[27, 28] 	 5 8
Answer: golden age My answer: [',', 'descended', 'into', 'turmoil']
[7] 	 5 8
Answer: 1066 My answer: ['England', 'in', '1066', 'and']
[5, 6] 	 5 8
Answer: 9th century My answer: ['9th', 'century', ',', 'followed']
[9] 	 5 8
Answer: biannually My answer: ['executive', 'powers', 'but', 'meets']
[] 	 5 8
Answer: the crimean war My answer: ['of', 'the', 'British', 'Empire']
[28, 29] 	 5 8
Answer: the near east My answer: ['Ottoman', 'Empire', 'and', 'the']
[1] 	 5 8
Answer: 1900 My answer: ['published', 'an', 'article', ',']
[1, 2] 	 5 8
Answer: the sailor My answer: ['connect', 'with', 'the', 'soldier']
[8, 9, 10] 	 5 8
Answer: a geographic featur

[20, 21] 	 5 8
Answer: the west My answer: ['centered', 'on', 'the', 'central']
[1] 	 5 8
Answer: 400,000 My answer: ['40,000', 'm2', ')', 'of']
[13, 14] 	 5 8
Answer: 19th century My answer: ['of', 'professional', 'sports', 'franchises']
[5] 	 5 8
Answer: half My answer: ['half', 'of', 'the', 'city']
[25] 	 5 8
Answer: bicycle My answer: ['continuous', '14-mile', '(', '23']
[21] 	 5 8
Answer: working-class My answer: ['major', 'branches', 'of', 'Christianity']
[11] 	 5 8
Answer: 1921 My answer: ['the', 'site', 'to', 'the']
[8, 9, 10] 	 5 8
Answer: central business district My answer: ['centered', 'on', 'the', 'central']
[16, 17, 18] 	 5 8
Answer: as extensive parks My answer: ['respectively', 'as', 'East', 'Rock']
[9, 10, 11] 	 5 8
Answer: free music concerts My answer: ['the', 'site', 'of', 'many']
[32] 	 5 8
Answer: 862,477 My answer: ['ˈheɪvən/', ',', 'noo-HAY-vən', ')']
[16] 	 5 8
Answer: 129,779 My answer: ['in', 'Connecticut', '(', 'after']
[4, 5] 	 5 8
Answer: about half My ans

[12, 13] 	 5 8
Answer: new haven harbor My answer: ['work', 'to', 'widen', 'I-95']
[12] 	 5 8
Answer: 1842 My answer: ["'s", 'Day', 'parade', ',']
[5, 6, 7] 	 5 8
Answer: heart of downtown My answer: ['heart', 'of', 'downtown', ',']
[19, 20] 	 5 8
Answer: the hamburger My answer: ['restaurant', "'s", 'founder', 'Louis']
[2] 	 5 8
Answer: 2000 My answer: ['parts', 'of', 'downtown', 'New']
[12, 13, 14] 	 5 8
Answer: better theological community My answer: ['establish', 'a', '(', 'in']
[2] 	 5 8
Answer: 56 My answer: ['in', 'New', 'Haven', ',']
[8] 	 5 8
Answer: manufacturing My answer: ['was', 'based', 'in', 'manufacturing']
[7] 	 5 8
Answer: 1877 My answer: ['decommissioned', 'in', '1877', 'following']
[4, 5, 6] 	 5 8
Answer: dock is planned My answer: ['is', 'planned', 'for', 'New']
[7] 	 5 8
Answer: 200 My answer: ['to', 'load', '200', 'trucks']
[4] 	 5 8
Answer: 2003 My answer: ['promotion', 'test', 'for', 'the']
[] 	 5 8
Answer: 360 state street . My answer: ['is', 'now', 'occupied'

[12, 13] 	 5 8
Answer: genetic engineering My answer: ['is', 'sometimes', 'used', 'to']
[1, 2] 	 5 8
Answer: the 1970s My answer: ['variety', 'of', 'techniques', 'have']
[14, 15, 16] 	 5 8
Answer: different phenotypic traits My answer: ['equivalent', ',', 'however', 'some']
[16] 	 5 8
Answer: phosphate-sugar My answer: ['around', 'each', 'other', 'to']
[4, 5] 	 5 8
Answer: untranslated regions My answer: ['regions', 'at', 'both', 'ends']
[11, 12] 	 5 8
Answer: in trans My answer: ['on', 'entirely', 'different', 'chromosomes']
[13, 14, 15] 	 5 8
Answer: barely 2 % My answer: ['suggest', 'that', ',', 'although']
[1, 2] 	 5 8
Answer: multicellular organisms My answer: ['the', 'embryo', 'is', 'engineered']
[11, 12] 	 5 8
Answer: industrial biotechnology My answer: ['modified', 'for', 'applications', 'in']
[5, 6, 7] 	 5 8
Answer: the rna molecules My answer: ['the', 'RNA', 'molecules', 'are']
[17] 	 5 8
Answer: constant My answer: ['carrying', 'out', 'basic', 'cell']
[8, 9] 	 5 8
Answer: en

[18, 19] 	 5 8
Answer: new york city My answer: ['in', '1904', ',', 'first']
[8] 	 5 8
Answer: 300,000 My answer: ['York', 'City', 'hosted', '300,000']
[19, 20] 	 5 8
Answer: 4.6 % My answer: ['highest', 'density', 'of', 'millionaires']
[37, 38, 39] 	 5 8
Answer: $ 7.1 billion My answer: ['York', 'City', 'was', 'the']
[8, 9] 	 5 8
Answer: 46.5 million My answer: ['square', 'feet', '(', '46.5']
[25, 26] 	 5 8
Answer: 51 million My answer: ['for', 'New', 'York', 'City']
[47] 	 5 8
Answer: 21 My answer: ['within', 'the', 'confines', 'of']
[9] 	 5 8
Answer: 200 My answer: ['population', 'had', 'diminished', 'to']
[8, 9, 10] 	 5 8
Answer: $ 40 billion My answer: ['Street', 'totaled', 'approximately', '$']
[25] 	 5 8
Answer: 1924 My answer: ['been', 'carried', 'by', 'a']
[10, 11] 	 5 8
Answer: over 200,000 My answer: ['of', 'public', 'transit', 'use']
[8] 	 5 8
Answer: 90,000 My answer: ['have', 'an', 'estimated', '90,000']
[13] 	 5 8
Answer: six My answer: ['city', 'required', 'their', 'ins

[3] 	 5 8
Answer: two My answer: ['League', 'Baseball', 'teams', 'in']
[3] 	 5 8
Answer: 234 My answer: ['with', 'at', 'least', 'some']
[16, 17] 	 5 8
Answer: five million My answer: ['provide', 'about', '225,000', 'admissions']
[15] 	 5 8
Answer: 234 My answer: ["'s", 'leading', 'specialty-food', 'export']
[18, 19] 	 5 8
Answer: 1.3 million My answer: ['Rican', 'migration', 'to', 'New']
[2, 3] 	 5 8
Answer: 59 % My answer: [',', 'particularly', 'Catholicism', '(']
[35] 	 5 8
Answer: 1959 My answer: ['Museum', 'for', 'African', 'Art']
[14, 15, 16, 17, 18, 19] 	 5 8
Answer: the bronx river My answer: ['flows', 'through', 'the', 'Bronx']
[36] 	 5 8
Answer: advertising My answer: ['streets', 'and', 'avenues', ',']
[18, 19] 	 5 8
Answer: 11.57 million My answer: ['12.21', 'million', ',', 'representing']
[36] 	 5 8
Answer: 9,000 My answer: ['over', '26,000', 'acres', '(']
[8] 	 5 8
Answer: cantilever My answer: ['important', 'piece', 'of', 'cantilever']
[1] 	 5 8
Answer: 1790 My answer: ['h

[30] 	 5 8
Answer: 1977 My answer: ['stylized', 'I', '❤', 'NY']
[31, 32] 	 5 8
Answer: 1.1 million My answer: ['Schools', 'system', ',', 'managed']
[14, 15] 	 5 8
Answer: 90 % My answer: ['the', 'rest', 'of', 'the']
[8] 	 5 8
Answer: 5,937 My answer: ['York', 'City', 'had', '5,937']
[24] 	 5 8
Answer: 200 My answer: ['York', 'City', 'was', 'the']
[29, 30] 	 5 8
Answer: half million My answer: ['in', 'New', 'York', 'City']
[24] 	 5 8
Answer: 469 My answer: ['Subway', 'system', 'is', 'the']
[11] 	 5 8
Answer: 12,000 My answer: ["'s", 'transportation', 'infrastructure', 'encompass']
[17] 	 5 8
Answer: 1971 My answer: ['in', 'the', 'United', 'States']
[31] 	 5 8
Answer: 7,000 My answer: ['bus', 'fleet', 'is', 'the']
[10, 11] 	 5 8
Answer: subway systems My answer: ['to', 'one', 'of', 'the']
[12] 	 5 8
Answer: 304.8 My answer: ['km2', ')', 'of', 'this']
[17] 	 5 8
Answer: 0.5 My answer: ['high', 'degree', 'of', 'income']
[1] 	 5 8
Answer: 37 My answer: ['city', "'s", 'population', 'is']
[25

[42, 43, 44] 	 5 8
Answer: medicine and agriculture My answer: ['geologic', 'record', ',', 'biogeography']
[13, 14] 	 5 8
Answer: is arbitrary My answer: ['specifies', 'that', 'the', 'distinction']
[9, 10] 	 5 8
Answer: an ape My answer: ['his', 'first', 'sight', 'of']
[32, 33, 34] 	 5 8
Answer: the malthusian aspects My answer: ['accepted', 'the', 'general', 'phenomenon']
[40, 41, 42] 	 5 8
Answer: 300 million years My answer: ['been', 'enough', 'time', 'for']
[9, 10, 11] 	 5 8
Answer: fancy pigeon breeding My answer: ['selection', ',', 'he', 'describes']
[23, 24] 	 5 8
Answer: 1250 copies My answer: ['was', 'first', 'published', 'on']
[26, 27] 	 5 8
Answer: scientific naturalism My answer: ['contributed', 'to', 'the', 'campaign']
[1, 2, 3] 	 5 8
Answer: the second edition My answer: ['Darwin', 'added', 'an', 'epigraph']
[2] 	 5 8
Answer: barnacle My answer: ['him', 'that', 'variation', 'arose']
[6] 	 5 8
Answer: 1825 My answer: ['in', '1825', 'to', 'study']
[42, 43] 	 5 8
Answer: nat

[11] 	 5 8
Answer: translation My answer: ['of', 'Buddhism', 'led', 'to']
[11] 	 5 8
Answer: hardly My answer: ['the', 'actual', 'practice', 'of']
[16, 17] 	 5 8
Answer: seventy translators My answer: ['the', '``', 'Septuagint', "''"]
[8, 9, 10] 	 5 8
Answer: subtitles or surtitles My answer: ['translations', 'presented', 'as', 'subtitles']
[2] 	 5 8
Answer: theoretical My answer: ['the', 'actual', 'practice', 'of']
[31] 	 5 8
Answer: events My answer: ['are', 'less', 'commonly', 'used']
[48] 	 5 8
Answer: 1453 My answer: [',', 'a', 'new', 'period']
[5, 6, 7] 	 5 8
Answer: contact and exchange My answer: ['contact', 'and', 'exchange', 'that']
[17, 18] 	 5 8
Answer: syntactic requirements My answer: [')', 'characteristics', 'of', 'a']
[20] 	 5 8
Answer: translation My answer: ['the', 'original', 'text', 'is']
[19, 20] 	 5 8
Answer: the monarch My answer: ['the', 'Commonwealth', ',', 'nominations']
[4, 5, 6] 	 5 8
Answer: 4 june 1917 My answer: ['June', '1917', 'by', 'King']
[9] 	 5 8
An

[3] 	 5 8
Answer: six My answer: ['districts', '.']
[23] 	 5 8
Answer: 100,000 My answer: ['city', 'projected', 'that', 'the']
[14] 	 5 8
Answer: five My answer: ['in', 'district', 'run', 'schools']
[12] 	 5 8
Answer: 1997 My answer: ['added', 'to', 'the', '215']
[13] 	 5 8
Answer: seven My answer: ['economic', 'activity', 'in', 'Pennsylvania']
[6] 	 5 8
Answer: 1,857 My answer: ['when', '1,857', 'shootings', 'were']
[6] 	 5 8
Answer: 1917 My answer: ['in', '1917', 'when', 'outrage']
[12] 	 5 8
Answer: 21 My answer: ['of', 'three', 'water', 'pollution']
[12, 13, 14] 	 5 8
Answer: $ 388 billion My answer: ['in', 'the', 'city', 'helped']
[10] 	 5 8
Answer: dropped My answer: ['in', 'district', 'run', 'schools']
[10] 	 5 8
Answer: increased My answer: [',', 'meanwhile', ',', 'have']
[20] 	 5 8
Answer: 18 My answer: ['tasked', 'with', 'guiding', 'growth']
[13] 	 5 8
Answer: 1994 My answer: ['the', 'code', 'was', 'split']
[22, 23] 	 5 8
Answer: grid plan My answer: ['more', 'like', 'an', 'E

[12] 	 5 8
Answer: silver My answer: ['in', '2015', 'Summer', 'in']
[9, 10] 	 5 8
Answer: $ 21,000 My answer: ['have', 'cost', 'about', 'US']
[5] 	 5 8
Answer: 1969 My answer: ['1969', ',', 'when', 'he']
[10] 	 5 8
Answer: 1983 My answer: ['citizen', 'on', 'September', '17']
[4] 	 5 8
Answer: 10,000 My answer: ['samurai', 'to', 'meet', 'this']
[17] 	 5 8
Answer: 1598 My answer: ['the', 'Japanese', 'campaigns', 'in']
[10, 11] 	 5 8
Answer: plate armor My answer: ['individual', 'scales', 'was', 'replaced']
[3, 4] 	 5 8
Answer: historical drama My answer: [')', 'has', 'always', 'been']
[24] 	 5 8
Answer: daimyo My answer: ['many', 'samurai', 'forces', 'that']
[1] 	 5 8
Answer: 1854 My answer: ['army', 'and', 'the', 'navy']
[2, 3, 4] 	 5 8
Answer: early heian period My answer: [',', 'the', 'late', '8th']
[18, 19, 20] 	 5 8
Answer: many wealthy merchants My answer: ['not', 'be', 'a', 'legal']
[5] 	 5 8
Answer: samurai My answer: ['samurai', 'such', 'as', 'the']
[9] 	 5 8
Answer: 1192 My ans

[8] 	 5 8
Answer: 1984 My answer: ['Chicago', ',', 'circa', '1984']
[6, 7] 	 5 8
Answer: house music My answer: ['to', 'house', 'music', 'were']
[7, 8, 9] 	 5 8
Answer: `` no ufos '' My answer: ['1990', 'single', '``', 'Vogue']
[2] 	 5 8
Answer: 1984 My answer: ['of', 'these', 'DJs', ',']
[2] 	 5 8
Answer: 1987 My answer: ['artist', 'Steve', '``', 'Silk']
[16] 	 5 8
Answer: 1979 My answer: ['from', 'Player', 'One', "'s"]
[] 	 5 8
Answer: one voice records My answer: ['Remix', "''", 'Roy', ',']
[14, 15] 	 5 8
Answer: acid house My answer: ['synthesizers', 'were', 'used', 'to']
[19, 20] 	 5 8
Answer: its roots My answer: ['examples', 'of', 'house', ',']
[24] 	 5 8
Answer: 1985 My answer: ['be', 'traced', 'to', 'Chicago']
[41] 	 5 8
Answer: 1986 My answer: ['record', 'generally', 'credited', 'as']
[12, 13, 14] 	 5 8
Answer: the black community My answer: ['many', 'of', 'the', 'messages']
[7, 8, 9, 10, 11] 	 5 8
Answer: `` new york underground '' My answer: ['for', 'the', '``', 'New']
[34,

[29, 30] 	 5 8
Answer: the sovereign My answer: [',', 'it', 'became', 'regular']
[10, 11] 	 5 8
Answer: letters patent My answer: ['usually', 'granted', 'less', 'ceremonially']
[17, 18] 	 5 8
Answer: exceedingly rare My answer: ['royal', 'assent', 'was', 'once']
[37, 38, 39, 40] 	 5 8
Answer: ( 24 june ) My answer: ['act', 'did', 'not', 'come']
[1] 	 5 8
Answer: 1994 My answer: ['was', 'granted', 'by', 'Order']
[18, 19] 	 5 8
Answer: committing adultery My answer: ['to', 'execute', 'his', 'fifth']
[10, 11, 12] 	 5 8
Answer: 11 march 1708 My answer: ['Anne', ',', 'similarly', 'withheld']
[5] 	 5 8
Answer: five My answer: ['five', 'times', 'during', 'the']
[22, 23] 	 5 8
Answer: governor general My answer: ['from', 'the', 'commons', 'stand']
[32, 33] 	 5 8
Answer: lieutenant governor My answer: ['was', 'granted', 'by', 'Order']
[2] 	 5 8
Answer: 2011 My answer: ['assembly', 'adopted', 'an', 'Arms']
[27] 	 5 8
Answer: 2007 My answer: ['was', 'refused', '(', 'or']
[15] 	 5 8
Answer: 2001 M

[24, 25] 	 5 8
Answer: 37.8 % My answer: ['of', 'February', '5', ',']
[20, 21] 	 5 8
Answer: 22.9 % My answer: ['Community', 'Survey', ',', 'White']
[30] 	 5 8
Answer: six My answer: ['during', 'the', '20th', 'century']
[1] 	 5 8
Answer: 1846 My answer: ['town', ',', 'West', 'Farms']
[18] 	 5 8
Answer: 1979 My answer: ['in', 'the', '1974', 'novel']
[8, 9] 	 5 8
Answer: 12.1 % My answer: ['under', 'one-eighth', '(', '12.1']
[14, 15] 	 5 8
Answer: 61.2 % My answer: ['of', 'February', '5', ',']
[0] 	 5 8
Answer: 320,640 My answer: ['home', ',', 'of', 'which']
[14] 	 5 8
Answer: 1985 My answer: ['and', '``', 'A', 'Kind']
[36, 37] 	 5 8
Answer: 1.3 million My answer: ['during', 'the', '20th', 'century']
[9] 	 5 8
Answer: 1917 My answer: ['Morris', 'Hillquit', 'in', 'the']
[7] 	 5 8
Answer: 1974 My answer: ['in', 'the', '1974', 'novel']
[62, 63] 	 5 8
Answer: 1.2 % My answer: [',', '53.5', '%', 'of']
[8, 9, 10] 	 5 8
Answer: rent control laws My answer: ['as', 'to', 'whether', 'rent']
[] 	 5

[4] 	 5 8
Answer: nine My answer: ['black', 'students', "'", 'entry']
[56] 	 5 8
Answer: professional My answer: ['president', 'of', 'Columbia', 'University']
[24] 	 5 8
Answer: gallbladder My answer: ['to', 'show', 'symptoms', 'of']
[34] 	 5 8
Answer: black My answer: ['and', 'after', 'his', 'presidency']
[7] 	 5 8
Answer: 1969 My answer: ['28', ',', '1969', ',']
[25] 	 5 8
Answer: freshman My answer: ['leg', 'be', 'amputated', 'but']
[1] 	 5 8
Answer: 1954 My answer: ['the', 'domino', 'theory', 'in']
[3, 4] 	 5 8
Answer: investment broker My answer: [',', 'also', 'handled', 'the']
[9] 	 5 8
Answer: cholecystitis My answer: ['to', 'show', 'symptoms', 'of']
[8, 9] 	 5 8
Answer: contract bridge My answer: ['learning', 'to', 'play', 'contract']
[5, 6] 	 5 8
Answer: cabinet meeting My answer: ['cabinet', 'meeting', 'when', 'Eisenhower']
[7] 	 5 8
Answer: millions My answer: ['demobilization', 'of', 'millions', 'of']
[9] 	 5 8
Answer: 1911 My answer: ['to', 'West', 'Point', 'in']
[] 	 5 8


[5, 6] 	 5 8
Answer: textile production My answer: ['textile', 'production', ',', 'reached']
[1, 2, 3] 	 5 8
Answer: 24 january 1706 My answer: ['Charles', 'Mordaunt', ',', '3rd']
[17] 	 5 8
Answer: 1978 My answer: [',', 'prestige', 'and', 'use']
[6, 7, 8] 	 5 8
Answer: 3 july 2006 My answer: ['on', '3', 'July', '2006']
[25, 26, 27] 	 5 8
Answer: the valencian community My answer: [':', '[', 'baˈlenθja', ']']
[26] 	 5 8
Answer: 1776 My answer: ['exaltation', 'of', 'ideas', 'the']
[32] 	 5 8
Answer: 20 My answer: ['biggest', 'on', 'the', 'Mediterranean']
[14, 15, 16] 	 5 8
Answer: over two hundred My answer: ['by', 'air', 'and', 'sea']
[19] 	 5 8
Answer: 1520–1522 My answer: ['the', 'comuneros', 'of', 'neighbouring']
[25, 26] 	 5 8
Answer: 3973 hectares My answer: ['on', 'in', 'the', 'municipality']
[6, 7] 	 5 8
Answer: 16 months My answer: ['for', '16', 'months', 'and']
[4, 5] 	 5 8
Answer: 58 m My answer: ['m', 'high', 'and', 'topped']
[11] 	 5 8
Answer: 1609 My answer: ['17th', 'cent

[23] 	 5 8
Answer: 1,800,000 My answer: ['concluding', 'Treaty', 'of', 'Versailles']
[1] 	 5 8
Answer: 18th My answer: ['(', 'after', '1707', ',']
[27] 	 5 8
Answer: 13,000,000 My answer: ['held', 'sway', 'over', 'about']
[11] 	 5 8
Answer: 1919 My answer: ['concluding', 'Treaty', 'of', 'Versailles']
[8] 	 5 8
Answer: 1997 My answer: ['to', 'China', 'in', '1997']
[1] 	 5 8
Answer: 1869 My answer: ['opened', 'under', 'Napoleon', 'III']
[16] 	 5 8
Answer: opium My answer: [',', 'the', 'Company', 'had']
[5] 	 5 8
Answer: 1605 My answer: ['1605', ')', 'and', 'Grenada']
[11] 	 5 8
Answer: 1948 My answer: ['it', 'was', 'called', ',']
[19] 	 5 8
Answer: 1756–1763 My answer: ['in', 'India', 'became', 'but']
[6] 	 5 8
Answer: 1967 My answer: ['in', '1967', ',', 'Bahrain']
[10] 	 5 8
Answer: 1914 My answer: ['with', 'Germany', 'were', 'realised']
[17, 18, 19, 20] 	 5 8
Answer: $ us 4.33 billion My answer: [',', 'with', 'insolvency', 'only']
[39, 40, 41, 42, 43, 44] 	 5 8
Answer: the `` great gam

[1] 	 5 8
Answer: 1584 My answer: ['granted', 'a', 'charter', 'to']
[16, 17] 	 5 8
Answer: literacy tests My answer: ['passed', 'a', 'new', 'constitution']
[46] 	 5 8
Answer: . My answer: ['for', 'the', 'temperature', 'to']
[30] 	 5 8
Answer: millions My answer: ['Carolina', 'Museum', 'of', 'Art']
[6, 7] 	 5 8
Answer: several million My answer: ['attract', 'several', 'million', 'tourists']
[11] 	 5 8
Answer: 1729 My answer: ['of', 'the', 'original', 'province']
[25, 26, 27] 	 5 8
Answer: over 25 million My answer: ['and', 'Great', 'Smoky', 'Mountains']
[7] 	 5 8
Answer: rose My answer: ['of', 'color', 'rose', 'markedly']
[17] 	 5 8
Answer: 1964 My answer: ['voice', 'in', 'the', 'state']
[33] 	 5 8
Answer: 1954 My answer: ['the', 'state', 'include', 'Hurricane']
[25] 	 5 8
Answer: 1996 My answer: ['Bill', 'Clinton', 'came', 'within']
[4] 	 5 8
Answer: 3 My answer: ['percent', 'of', 'the', 'free']
[24] 	 5 8
Answer: 1780 My answer: ['the', 'war', 'took', 'place']
[10, 11, 12] 	 5 8
Answe

KeyboardInterrupt: 

<b>model 2 GRU seq2seq</b>

In [69]:
decoder_input_data = np.zeros(
    (trainig_size, 2, max_context_size),
    dtype='float32')

decoder_target_data = np.zeros(
    (trainig_size, 2, max_context_size),
    dtype='float32')

for i, answer_indices in enumerate(train_answers_indices):
    if len(answer_indices) > 1:
        decoder_input_data[i, 1, answer_indices[0]] = 1.
        decoder_target_data[i, 0, answer_indices[0]] = 1.
        decoder_target_data[i, 1, answer_indices[-1]] = 1.

In [112]:
qc_relations = Input(shape=(None, max_context_size))
encoder_outputs, encoder_state= GRU(output_dim = max_context_size,
                                    return_state = True,
                                    activation = 'tanh')(qc_relations)

decoder_inputs = Input(shape=(None, max_context_size))
decoder_gru = GRU(output_dim = max_context_size,
                  return_sequences = True,
                  return_state = True,
                  activation = 'tanh')
decoder_outputs, _ = decoder_gru(decoder_inputs,
                                 initial_state = encoder_state)
decoder_dense = Dense(max_context_size,
                      activation='softmax')

start_end = decoder_dense(decoder_outputs)

  after removing the cwd from sys.path.
  # Remove the CWD from sys.path while we load stuff.


In [None]:
# Define the model that will turn
# `encoder_input_data` & `decoder_input_data` into `decoder_target_data`
model = Model([qc_relations, decoder_inputs], start_end)
model.compile(optimizer='rmsprop', loss='categorical_crossentropy') #optimizer
model.fit([training_input, decoder_input_data], decoder_target_data,
          batch_size=batch_size,
          epochs=epochs,
          validation_split=0.2)

#define inference model
encoder_model = Model(qc_relations, encoder_state)

decoder_state_inputs = Input(shape=(max_context_size,))
decoder_outputs, decoder_state = decoder_gru(decoder_inputs,
                                             initial_state = decoder_state_inputs)
start_end = decoder_dense(decoder_outputs)
decoder_model = Model(
    [decoder_inputs, decoder_state_inputs],
    [start_end, decoder_state])

Train on 19400 samples, validate on 4850 samples
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
 3328/19400 [====>.........................] - ETA: 1:23 - loss: 0.0691

In [96]:
def get_start_end(question):
    # Encode the input as state vectors.
    states_value = encoder_model.predict(question)

    # Generate empty target sequence of length 1.
    Go_index = np.zeros((1, 1, max_context_size))
    
    start_index , states_value = decoder_model.predict( [Go_index, states_value])
    end_index, _ = decoder_model.predict( [start_index, states_value])

    return start_index, end_index

In [106]:
my_answers = []
for i,embed_query in enumerate(embed_train_qs):
    start_idx, end_idx = get_start_end(training_input[i:i+1])
    start_idx = np.argmax(start_idx)
    end_idx = np.argmax(end_idx)
    print(train_answers_indices[i], "\t", start_idx, end_idx)
    print("Answer:", train_answers[i], "My answer:", tokenized_train_context[i][start_idx:end_idx+1])

[31] 	 5 9
Answer: cylinder My answer: ['the', 'list', 'for', 'redefinition', 'is']
[3, 4, 5] 	 6 7
Answer: time vs. energy My answer: ['.']
[15, 16, 17] 	 5 9
Answer: quantum of action My answer: ['some', 'multiple', 'of', 'a', 'very']
[11] 	 5 9
Answer: 1913 My answer: ['quantized', 'model', 'of', 'the', 'atom']
[7] 	 5 9
Answer: h My answer: ['existence', 'of', 'h', '(', 'but']
[7] 	 5 9
Answer: h My answer: ['existence', 'of', 'h', '(', 'but']
[42] 	 1 8
Answer: f My answer: ['recognized', 'in', '1900', 'by', 'Max', 'Planck', ',', 'it']
[9] 	 5 9
Answer: 1839 My answer: ['Alexandre', 'Edmond', 'Becquerel', 'in', '1839']
[19] 	 5 9
Answer: 1911 My answer: ['as', 'the', '``', 'ultraviolet', 'catastrophe']
[78, 79] 	 1 8
Answer: multiphoton effect My answer: ['kinetic', 'energy', '(', 'for', 'each', 'photoelectron', ')', 'is']
[5, 6] 	 5 9
Answer: nuclear magneton My answer: ['nuclear', 'magneton', 'are', 'units', 'which']
[9, 10] 	 5 9
Answer: 555 nanometres My answer: ['with', 'a', 

[9] 	 5 8
Answer: 2005 My answer: ['Fame', 'inducted', 'Spielberg', 'in']
[14] 	 5 9
Answer: intrusive My answer: ['use', 'of', 'cut', 'scenes', 'in']
[10] 	 5 9
Answer: 1993 My answer: [',', 'and', 'Jurassic', 'Park', '(']
[2] 	 5 9
Answer: 1984 My answer: ['their', 'romance', ',', 'and', 'in']
[11, 12, 13] 	 5 8
Answer: $ 200 million My answer: ['box', 'office', 'success', ',']
[18, 19] 	 5 9
Answer: # 9 My answer: ['Film', 'Institute', 'listed', 'it', 'among']
[6] 	 5 9
Answer: 1989 My answer: ['the', '1989', 'National', 'Scout', 'Jamboree']
[8] 	 5 9
Answer: 1979 My answer: ['broke', 'up', 'in', '1979', ',']
[21, 22] 	 5 8
Answer: the 1930s My answer: ['began', 'opening', 'to', 'Western']
[13, 14] 	 5 9
Answer: his father My answer: ['$', '500', ',', 'most', 'of']
[31, 32] 	 5 9
Answer: his father My answer: ['most', 'autobiographical', 'aspect', 'of', 'Spielberg']
[2] 	 5 9
Answer: 1984 My answer: ['their', 'romance', ',', 'and', 'in']
[13, 14] 	 5 9
Answer: 15–20 years My answer:

[9, 10] 	 5 9
Answer: elevation angle My answer: ['the', 'target', 'and', 'the', 'elevation']
[6] 	 6 7
Answer: 1940 My answer: ['1940', '.']
[2] 	 5 9
Answer: altitude My answer: ['jet', 'aircraft', 'limit', 'target', 'opportunities']
[32] 	 5 9
Answer: 1954 My answer: ['arms', ',', 'PVO', 'Strany', ',']
[3, 4, 5, 6] 	 1 8
Answer: `` effective ceiling '' My answer: ['British', 'adopted', '``', 'effective', 'ceiling', "''", ',', 'meaning']
[19, 20, 21] 	 1 8
Answer: 8 july 1914 My answer: ['British', 'recognised', 'the', 'need', 'for', 'anti-aircraft', 'capability', 'a']
[33, 34] 	 5 8
Answer: its height My answer: ['approach', 'to', 'HAA', 'fire']
[27, 28] 	 5 9
Answer: experimental usefulness My answer: ['lasers', 'in', 'combat', 'since', 'the']
[8, 9] 	 5 9
Answer: 18-pdr guns My answer: ['the', 'war', 'but', '18-pdr', 'guns']
[4, 5] 	 6 7
Answer: into battalions My answer: ['or', 'equivalent']
[27, 28, 29] 	 5 8
Answer: for 20 seconds My answer: ['British', 'definition', 'was', '``

[23] 	 5 9
Answer: 3 My answer: [',', 'which', 'was', 'under', 'command']
[] 	 5 8
Answer: area air defence My answer: ['air', 'defence', 'of', 'a']
[8, 9] 	 5 9
Answer: the cold war My answer: ['by', 'Germany', 'during', 'the', 'war']
[17, 18, 19] 	 5 9
Answer: 90-day screening period My answer: ['for', 'both', 'types', 'except', 'with']
[5, 6] 	 5 9
Answer: $ 500,000 My answer: ['$', '500,000', 'the', 'Secretary', 'of']
[4, 5] 	 5 9
Answer: eight years My answer: ['years', 'before', 'the', 'first', 'national']
[21] 	 33 8
Answer: seven My answer: []
[30] 	 1 8
Answer: butterflies My answer: ['further', 'noted', 'that', 'the', 'San', 'Bruno', 'plan', 'was']
[6, 7] 	 6 7
Answer: two ways My answer: ['two', 'ways']
[28, 29] 	 5 9
Answer: the clinton administration My answer: ['Endangered', 'Species', 'Act', ':', 'law']
[11, 12] 	 5 9
Answer: 16 birds My answer: ['1941', 'was', 'estimated', 'at', 'about']
[] 	 5 8
Answer: habitat conservation plan My answer: ['San', 'Bruno', 'plan', 'was

[62, 63, 64] 	 1 8
Answer: the achaemenid empire My answer: ['reached', 'the', 'pinnacle', 'of', 'its', 'power', 'during', 'the']
[10, 11, 12, 13] 	 5 9
Answer: mamluks ( slave-warriors ) My answer: ['in', 'the', 'Abbasid', 'army', 'as']
[46] 	 5 9
Answer: watermelons My answer: ['has', 'been', 'a', 'top', 'five']
[7, 8] 	 5 9
Answer: the 1979 constitution My answer: ['incompatible', 'with', 'the', 'constitution', 'or']
[18, 19] 	 5 9
Answer: were executed My answer: ['had', 'initially', 'joined', 'with', 'Islamists']
[33] 	 5 8
Answer: petrochemicals My answer: ['in', 'the', 'fields', 'of']
[13, 14] 	 5 9
Answer: 18 % My answer: ['75', '%', 'was', 'based', 'on']
[1] 	 5 9
Answer: 2004 My answer: ['its', 'first', 'wind-powered', 'and', 'geothermal']
[32, 33] 	 5 8
Answer: natural gas My answer: ['and', 'middle', 'power', ',']
[48] 	 1 8
Answer: *ar-yo- My answer: ['Middle', 'Iranian', 'ērān', 'and', 'aryān', 'are', 'oblique', 'plural']
[52, 53] 	 1 8
Answer: scientific writing My answe

KeyboardInterrupt: 

In [108]:
import csv
with open('result.csv', 'w') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(["id","answer"])
    for i,embed_query in enumerate(embed_test_qs):
        start_idx, end_idx = get_start_end(testing_input[i:i+1])
        start_idx = np.argmax(start_idx)
        end_idx = np.argmax(end_idx)
        my_answer = tokenized_test_context[i][start_idx:end_idx+1]
        writer.writerow([str(i), " ".join(my_answer)])