In [None]:
# ✅ Step 1: Install Required Libraries
!pip install transformers datasets --quiet


In [None]:
# ✅ Step 2: Download SQuAD v2.0 Dataset Automatically
import requests

url = "https://rajpurkar.github.io/SQuAD-explorer/dataset/train-v2.0.json"

# A timeout keeps the cell from hanging forever on a stalled connection
# (requests has no timeout by default).
response = requests.get(url, timeout=60)

# Fail loudly on an HTTP error (404, 500, ...) instead of saving the error page
# as "train-v2.0.json" and reporting success; the next cell would otherwise
# crash with a confusing JSON parsing error.
response.raise_for_status()

# Write the raw bytes unchanged so the file on disk matches the published dataset.
with open("train-v2.0.json", "wb") as f:
    f.write(response.content)

print("✅ Dataset downloaded successfully!")


✅ Dataset downloaded successfully!


In [None]:
# ✅ Step 3: Load Dataset and Extract First QA Pair
import json

# Load dataset.
# The encoding is given explicitly: the file is UTF-8 JSON containing non-ASCII
# text (e.g. "Beyoncé"), and without it Python falls back to the platform
# default encoding, which is not UTF-8 on every system.
with open("train-v2.0.json", "r", encoding="utf-8") as f:
    squad_data = json.load(f)

# Extract first QA pair: first article -> its first paragraph -> that
# paragraph's context text and the first question asked about it.
first_article = squad_data["data"][0]
first_paragraph = first_article["paragraphs"][0]

context = first_paragraph["context"]
question = first_paragraph["qas"][0]["question"]

# Only the first 300 characters of the context are shown to keep the output short.
print("📚 Context snippet:", context[:300], "...")
print("❓ Question:", question)


📚 Context snippet: Beyoncé Giselle Knowles-Carter (/biːˈjɒnseɪ/ bee-YON-say) (born September 4, 1981) is an American singer, songwriter, record producer and actress. Born and raised in Houston, Texas, she performed in various singing and dancing competitions as a child, and rose to fame in the late 1990s as lead singe ...
❓ Question: When did Beyonce start becoming popular?


In [None]:
# ✅ Step 4: Run Question Answering
from transformers import pipeline

# Load QA pipeline.
# The model and revision are pinned explicitly instead of relying on the
# library default, so results stay reproducible if that default ever changes
# and the "No model was supplied" warning goes away. These are the checkpoint
# and revision the default resolved to when this notebook was last run
# (a DistilBERT model fine-tuned on SQuAD).
qa_pipeline = pipeline(
    "question-answering",
    model="distilbert/distilbert-base-cased-distilled-squad",
    revision="564e9b5",
)

# Get answer: the pipeline extracts the answer span from `context`.
result = qa_pipeline(question=question, context=context)

# Display result
print("✅ Answer:", result['answer'])


No model was supplied, defaulted to distilbert/distilbert-base-cased-distilled-squad and revision 564e9b5 (https://huggingface.co/distilbert/distilbert-base-cased-distilled-squad).
Using a pipeline without specifying a model name and revision in production is not recommended.
Device set to use cpu


✅ Answer: late 1990s


In [None]:
# ✅ Step 5: Bonus - Show Multiple QAs
# Answer the first question of each of the first three paragraphs of the first
# article. Increase the slice bound to loop through more paragraphs.
#
# Loop-local names (sample_*) are used on purpose: reusing `context`,
# `question` and `result` here would overwrite the values set in Steps 3-4,
# so re-running Step 4 afterwards would silently answer a different question.
# Slicing also tolerates an article with fewer than three paragraphs.
sample_paragraphs = squad_data["data"][0]["paragraphs"][:3]

for number, para in enumerate(sample_paragraphs, start=1):
    sample_context = para["context"]
    sample_question = para["qas"][0]["question"]
    sample_result = qa_pipeline(question=sample_question, context=sample_context)

    print(f"\n❓ Question {number}: {sample_question}")
    print(f"✅ Answer: {sample_result['answer']}")



❓ Question 1: When did Beyonce start becoming popular?
✅ Answer: late 1990s

❓ Question 2: After her second solo album, what other entertainment venture did Beyonce explore?
✅ Answer: acting

❓ Question 3: In her music, what are some recurring elements in them?
✅ Answer: love, relationships, and monogamy


In [None]:
from transformers import pipeline

# Load the QA pipeline.
# The model and revision are pinned explicitly rather than relying on the
# library default, so the answer stays reproducible and the "No model was
# supplied" warning is not emitted. These are the checkpoint and revision the
# default resolved to when this notebook was last run.
qa_pipeline = pipeline(
    "question-answering",
    model="distilbert/distilbert-base-cased-distilled-squad",
    revision="564e9b5",
)

# 🔸 Your own custom context (the passage the answer is extracted from)
context = """
Tomatoes are one of the most popular vegetables used in cooking.
They are rich in vitamins A and C, and contain antioxidants like lycopene.
Tomatoes grow best in warm climates with plenty of sunlight.
"""

# 🔸 Your custom question
question = "What vitamin do tomatoes contain?"

# 🔸 Get the answer
result = qa_pipeline(question=question, context=context)

# 🔸 Print result
print("❓ Question:", question)
print("📚 Context:", context)
print("✅ Answer:", result['answer'])


No model was supplied, defaulted to distilbert/distilbert-base-cased-distilled-squad and revision 564e9b5 (https://huggingface.co/distilbert/distilbert-base-cased-distilled-squad).
Using a pipeline without specifying a model name and revision in production is not recommended.
Device set to use cpu


❓ Question: What vitamin do tomatoes contain?
📚 Context: 
Tomatoes are one of the most popular vegetables used in cooking.
They are rich in vitamins A and C, and contain antioxidants like lycopene.
Tomatoes grow best in warm climates with plenty of sunlight.

✅ Answer: A and C
