# 🧠 Predictive Question Paper Generator
This notebook demonstrates the full pipeline: loading the sample question dataset, preprocessing the question text, training a regression model on question frequency, and generating a predicted question paper.

In [None]:
# Step 1: Import Required Libraries
import pandas as pd
from src.preprocessing import preprocess_data
from src.model import train_regression_model
from src.generate_paper import generate_question_paper

In [None]:
# Step 2: Load Dataset
# The path is relative to the notebook's working directory; run the notebook
# from its own folder so that "../data" resolves.
dataset_path = "../data/sample_questions.csv"
df = pd.read_csv(dataset_path)
# Trailing expression: the notebook renders the first rows as the cell output.
df.head()

In [None]:
# Step 3: Preprocess Questions
# preprocess_data is given the raw frame and the name of the text column
# ("question"); its three return values are unpacked below.
# NOTE(review): X is presumably the vectorized feature matrix and `vectorizer`
# the fitted transformer -- confirm against src.preprocessing.
preprocessed = preprocess_data(df, text_column="question")
X, vectorizer, df = preprocessed  # df is rebound to the frame returned by the helper

# Regression target: the "frequency" column of the returned frame.
y = df["frequency"]

In [None]:
# Step 4: Train Regression Model
# train_regression_model receives the features and target and returns five
# values: the model, a score, and three further values unpacked here as
# X_test, y_test and y_pred.
# NOTE(review): the helper presumably performs its own train/test split and
# `accuracy` is presumably already a percentage -- confirm in src.model.
training_output = train_regression_model(X, y)
model, accuracy, X_test, y_test, y_pred = training_output

# Report the score with two decimal places.
accuracy_report = f"Model Accuracy Estimate: {accuracy:.2f}%"
print(accuracy_report)

In [None]:
# Step 5: Generate Predicted Question Paper
# Pass the preprocessed frame, the trained model and the vectorizer to the
# generator, requesting top_k=10.
# NOTE(review): top_k presumably caps the number of questions selected --
# confirm in src.generate_paper.
predicted_paper = generate_question_paper(
    df,
    model,
    vectorizer,
    top_k=10,
)
print(predicted_paper)