### Imports

In [135]:
import transformers
from newspaper import Article
from transformers import AutoModelForQuestionAnswering, AutoTokenizer, pipeline

# Extractive question answering: this identifier is handed to
# `pipeline("question-answering", model=model_name)` to choose which
# checkpoint gets loaded.
# NOTE(review): the name suggests a cased DistilBERT distilled on SQuAD --
# confirm against the model card.
model_name = "distilbert-base-cased-distilled-squad"

### Call pipeline & load model

In [136]:
# Build the question-answering pipeline once; the cells that follow reuse
# this object for every (question, context) pair.
question_answerer = pipeline(task="question-answering", model=model_name)

### Extract text from article URL

In [137]:
# Article whose extracted text is used as the `context` for the question
# asked in the next cell.
url = "https://www.cbssports.com/nfl/news/2022-super-bowl-score-rams-beat-bengals-as-matthew-stafford-mvp-cooper-kupp-connect-late-in-comeback-win/live/"
article = Article(url)
# Fetch the page, then parse it; `article.text` is read only after both calls.
article.download()
article.parse()
text = article.text

### Run model

In [139]:
# Ask a single question against the article text and report the answer
# together with its score rounded to four decimal places.
question = "Who won?"
result = question_answerer(question=question, context=text)
print(f"Question: {question}")
print("Answer 1: '{}', score: {}".format(result["answer"], round(result["score"], 4)))

Question: Who won?
Answer 1: 'Los Angeles Rams', score: 0.3778


### Test multiple articles & questions

In [141]:
# Ask the same set of questions against three different write-ups of the
# game and print each article's answer side by side.
url1 = "https://www.cbssports.com/nfl/gametracker/recap/NFL_20220213_LAR@CIN/"
url2 = "https://www.usatoday.com/story/sports/nfl/super-bowl/2022/02/13/super-bowl-2022-live-updates-score-bengals-rams-analysis/6774505001/"
url3 = "https://www.cbssports.com/nfl/news/2022-super-bowl-score-rams-beat-bengals-as-matthew-stafford-mvp-cooper-kupp-connect-late-in-comeback-win/live/"

# Fetch and parse every article in one loop rather than three copy-pasted
# stanzas. Each article is downloaded and parsed before the next one starts.
articles = [Article(source_url) for source_url in (url1, url2, url3)]
for fetched in articles:
    fetched.download()
    fetched.parse()

# Keep the per-article names so other cells that refer to them still work.
article1, article2, article3 = articles
texts = [fetched.text for fetched in articles]
text1, text2, text3 = texts

qs = [
    "Where was the 2022 Super Bowl?",
    "What team won the 2022 Super Bowl?",
    "What was the score of the 2022 Super Bowl?",
    "Who scored the first touchdown?",
    "How many yards did Cooper Kupp have?",
    "How many passes did Burrow complete?",
    "How many yards did Burrow have?",
    "Why did the Rams win?",
]

for question in qs:
    # Query every article first, then print, so the output for one question
    # is emitted together once all of its answers are available.
    results = [
        question_answerer(question=question, context=article_text)
        for article_text in texts
    ]
    print("Question: " + question)
    # Answers are numbered from 1 in the same order as url1, url2, url3.
    for number, answer in enumerate(results, start=1):
        print(
            f"Answer {number}: '{answer['answer']}', score: {round(answer['score'], 4)}"
        )

Question: Where was the 2022 Super Bowl?
Answer 1: 'Los Angeles', score: 0.2835
Answer 2: 'SoFi Stadium', score: 0.9382
Answer 3: 'SoFi Stadium', score: 0.8948
Question: What team won the 2022 Super Bowl?
Answer 1: 'the Rams', score: 0.4162
Answer 2: 'Los Angeles Rams', score: 0.7944
Answer 3: 'The Rams', score: 0.4787
Question: What was the score of the 2022 Super Bowl?
Answer 1: '13-10', score: 0.8217
Answer 2: '23-20', score: 0.3426
Answer 3: '23-20', score: 0.0002
Question: Who scored the first touchdown?
Answer 1: 'Ernest Jones', score: 0.9161
Answer 2: 'Ja'Marr Chase', score: 0.631
Answer 3: 'Odell Beckham Jr.', score: 0.4505
Question: How many yards did Cooper Kupp have?
Answer 1: '39', score: 0.8363
Answer 2: '92', score: 0.8979
Answer 3: '92', score: 0.9334
Question: How many passes did Burrow complete?
Answer 1: 'seven', score: 0.7126
Answer 2: '46', score: 0.9043
Answer 3: '22 of 33', score: 0.5857
Question: How many yards did Burrow have?
Answer 1: 'seven', score: 0.7643
An