In [None]:
import re
import os
import json
import traceback
import pandas as pd
from dotenv import load_dotenv

from langchain.chains.llm import LLMChain
from langchain.prompts import PromptTemplate
from langchain_google_genai import ChatGoogleGenerativeAI

In [None]:
from google.oauth2 import service_account

# Path to the service-account key file. GOOGLE_APPLICATION_CREDENTIALS takes
# precedence when it is set, so the notebook can run on another machine without
# editing this cell; the original local path remains the fallback.
# NOTE(review): keep the key file itself out of version control.
credential_path = os.environ.get(
    "GOOGLE_APPLICATION_CREDENTIALS",
    "/home/petpooja-739/Learning/MCQ Generator/spheric-shield-442613-b6-f9df1a08a88c.json",
)

# Build the credentials object that is handed to the chat model below.
credential = service_account.Credentials.from_service_account_file(credential_path)

In [None]:
# Chat model shared by both chains defined later in the notebook.
# It authenticates with the service-account credentials loaded above.
llm = ChatGoogleGenerativeAI(
    model="gemini-1.5-flash-001",
    credentials=credential,
    # temperature=0: presumably chosen for the most repeatable output — confirm.
    temperature=0,
    # No explicit output-token cap is passed from this notebook.
    max_tokens=None
)

In [None]:
# Example of the answer format the model is asked to imitate: three numbered
# placeholder questions ("1".."3"), each with four lettered options and a
# "correct" field. It is serialised with json.dumps and pasted into the
# generation prompt further down.
RESPONSE_JSON = {
    str(question_no): {
        "mcq": "multiple choice question",
        "options": {letter: "choice here" for letter in "abcd"},
        "correct": "correct answer",
    }
    for question_no in range(1, 4)
}

In [None]:
# Prompt for the quiz-generation step.
# Placeholders filled at run time: {text}, {number}, {subject}, {tone}, {response_json}.
# The backslashes at the end of two lines inside the string are line
# continuations, so the text on either side is joined without a newline.
TEMPLATE = """
Text:{text}
You are an expert MCQ maker. Given the above text, it is your job to \
create a quiz  of {number} multiple choice questions for {subject} students in {tone} tone. 
Make sure the questions are not repeated and check all the questions to be conforming the text as well.
Make sure to format your response like  RESPONSE_JSON below  and use it as a guide. \
Ensure to make {number} MCQs
### RESPONSE_JSON
{response_json}

"""

In [None]:
# Prompt for the review step. Placeholders filled at run time: {subject}, {quiz}.
# NOTE(review): the line continuation after "students." joins it to "You need"
# with no space in between, and "at per" looks like a typo for "on par". Both are
# left untouched here because editing the prompt text changes the model's output.
TEMPLATE2 = """
You are an expert english grammarian and writer. Given a Multiple Choice Quiz for {subject} students.\
You need to evaluate the complexity of the question and give a complete analysis of the quiz. Only use at max 50 words for complexity analysis. 
if the quiz is not at per with the cognitive and analytical abilities of the students,\
update the quiz questions which needs to be changed and change the tone such that it perfectly fits the student abilities
Quiz_MCQs:
{quiz}

Check from an expert English Writer of the above quiz:
"""

In [None]:
# Prompt object for the generation step: wraps TEMPLATE and declares the five
# variables that TEMPLATE interpolates.
quiz_generation_prompt = PromptTemplate(
    input_variables=["text", "number", "subject", "tone", "response_json"],
    template=TEMPLATE,
)

In [None]:
# Generation step: pairs the generation prompt with the shared llm. The result
# is published under the key "quiz", which matches the {quiz} placeholder of the
# review prompt.
quiz_chain = LLMChain(llm=llm, prompt=quiz_generation_prompt, output_key="quiz", verbose=True)

In [None]:
# Sanity check: show how the generation chain is configured.
print(quiz_chain)

In [None]:
# Prompt object for the review step: wraps TEMPLATE2 and declares the two
# variables that TEMPLATE2 interpolates.
quiz_evaluation_prompt = PromptTemplate(
    input_variables=["subject", "quiz"],
    template=TEMPLATE2
)

In [None]:
# Review step: pairs the evaluation prompt with the shared llm and publishes its
# result under the key "review".
review_chain = LLMChain(llm=llm, prompt=quiz_evaluation_prompt, output_key="review", verbose=True)

In [None]:
from langchain.chains.sequential import SequentialChain

# Two-step pipeline: quiz_chain is listed first and review_chain second.
# input_variables are the values the caller must supply; output_variables are
# the keys ("quiz" and "review") exposed in the final result.
generate_evaluate_chain = SequentialChain(
    chains=[quiz_chain, review_chain],
    input_variables=["text", "number", "subject", "tone", "response_json"],
    output_variables=["quiz", "review"],
    verbose=True
)

In [None]:
# Location of the source text the quiz is generated from.
# NOTE(review): this is an absolute path on one machine; anyone else running the
# notebook has to edit it.
file_path = r"/home/petpooja-739/Learning/MCQ Generator/data.txt"
# Echo the path as the cell output.
file_path

In [None]:
# Read the whole source document into memory as a single string.
# The encoding is given explicitly so the result does not depend on the
# platform's locale default.
# NOTE(review): UTF-8 is assumed for data.txt — confirm.
with open(file_path, 'r', encoding="utf-8") as file:
    TEXT = file.read()

In [None]:
# Show the loaded text in full to confirm the right file was read.
print(TEXT)

In [None]:
# Length of the loaded text in characters.
len(TEXT)

In [None]:
# Quiz parameters fed into the generation prompt: how many questions to ask for,
# the audience's subject, and the tone of the wording.
NUMBER, SUBJECT, TONE = 5, "Data Science", "simple"

In [None]:
%time
from langchain_community.callbacks.manager import get_openai_callback

# How to setup Token Usage Tracking in LangChain
with get_openai_callback() as cb:
    response = generate_evaluate_chain(
        {
            "text": TEXT,
            "number": NUMBER,
            "subject": SUBJECT,
            "tone": TONE,
            "response_json": json.dumps(RESPONSE_JSON)
        }
    )

In [None]:
# Report the usage counters gathered by the callback handler `cb`, one per line.
print(
    f"Total Tokens: {cb.total_tokens}",
    f"Prompt Tokens: {cb.prompt_tokens}",
    f"Completion Tokens: {cb.completion_tokens}",
    f"Total Cost: {cb.total_cost}",
    sep="\n",
)

In [None]:
# Display the full result returned by the pipeline.
response

In [None]:
# Pull the JSON object out of the generation step's reply.
quiz_raw = response.get("quiz")
if not isinstance(quiz_raw, str):
    # Fail with a clear message instead of a TypeError from inside `re`.
    raise ValueError(
        f"Expected the 'quiz' output to be text, got {type(quiz_raw).__name__}"
    )

# Greedy match from the first "{" to the last "}" (DOTALL lets "." span
# newlines), so whatever the model wrote around the JSON object is dropped.
quiz_match = re.search(r'\{.*\}', quiz_raw, re.DOTALL)
if quiz_match is None:
    # Fail with a clear message instead of AttributeError on None.group.
    raise ValueError("No JSON object found in the generated quiz text")

# `quiz` holds the JSON text; it is parsed in the next cell.
quiz = quiz_match.group(0)

In [None]:
# Parse the extracted JSON text into Python objects.
# The isinstance guard makes the cell safe to re-run: once `quiz` has been
# parsed it is no longer a string, and passing it to json.loads again would
# raise TypeError.
if isinstance(quiz, str):
    quiz = json.loads(quiz)

In [None]:
# Display the parsed quiz.
quiz

In [None]:
# Flatten each parsed question into one table row: the question text, its
# options rendered as "letter: text" joined with " | ", and the correct answer.
quiz_table_data = [
    {
        "MCQ": entry["mcq"],
        "Choice": " | ".join(
            f"{label}: {text}" for label, text in entry["options"].items()
        ),
        "Correct": entry["correct"],
    }
    for entry in quiz.values()
]

In [None]:
# Display the flattened rows before they go into a DataFrame.
quiz_table_data

In [None]:
# Build the table from the list of row dicts: one row per question, with the
# columns taken from the dict keys ("MCQ", "Choice", "Correct").
quiz_df = pd.DataFrame(quiz_table_data)

In [None]:
# Display the quiz table.
quiz_df

In [None]:
# Save the quiz table as CSV; the relative file name is resolved against the
# current working directory. index=False leaves the DataFrame's row index out
# of the file.
quiz_df.to_csv("DataScienceQuiz.csv", index=False)