# Import Libraries

In [4]:
import pandas as pd
import numpy as np
import spacy
import matplotlib.pyplot as plt
import os
from transformers import pipeline, AutoTokenizer, AutoModelForSequenceClassification, AutoModelForCausalLM
import torch
import re
import tensorflow as tf

import warnings
warnings.filterwarnings('ignore')
pd.set_option('display.max_columns', None)  # Show all columns
pd.set_option('display.max_rows', None)  # Show all rows
pd.set_option('display.max_colwidth', None)  # Show full content in each cell
pd.set_option('display.width', 1000)  # Set max width

# Load spaCy's English model
nlp = spacy.load('en_core_web_sm')

# Question Classifier

## Text-Classification

In [None]:
tokenizer = AutoTokenizer.from_pretrained("uw-vta/bloominzer-0.1")
model = AutoModelForSequenceClassification.from_pretrained("uw-vta/bloominzer-0.1")
bloominzer = pipeline("text-classification", model=model, tokenizer=tokenizer)

In [None]:
print(bloominzer("If I have 2 pair of apple, can i make apple pie with it?"))

Device set to use mps:0


[{'label': 'Synthesis', 'score': 0.9990537762641907}]


## LLM Classification

## Zero-Shot

### BART

In [None]:
tokenizer = AutoTokenizer.from_pretrained("facebook/bart-large-mnli")
model = AutoModelForSequenceClassification.from_pretrained("facebook/bart-large-mnli")

bart = pipeline("zero-shot-classification",
                      model=model , tokenizer=tokenizer)

Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`
Device set to use mps:0


In [None]:
sequence_to_classify = "If I have 2 pair of apple, can i make apple pie with it?"
candidate_labels = ['knowledge', 'comprehension', 'application', 'analysis','synthesis', 'evaluation']
label = bart(sequence_to_classify, candidate_labels)

In [15]:
label['labels'][0]

'application'

### bart-lage-mnli-yahoo-answers

In [26]:
tokenizer = AutoTokenizer.from_pretrained("joeddav/bart-large-mnli-yahoo-answers")
model = AutoModelForSequenceClassification.from_pretrained("joeddav/bart-large-mnli-yahoo-answers")

ya_classifier = pipeline("zero-shot-classification",
                      model=model , tokenizer=tokenizer)

Device set to use mps:0


In [31]:
sequence_to_classify = "If I have 2 pair of apple, can i make apple pie with it?"
candidate_labels = ['knowledge', 'comprehension', 'application', 'analysis','synthesis', 'evaluation']
hypothesis_template = "This text is about blooms taxonomy and it is classified as {}."
label = ya_classifier(sequence_to_classify, candidate_labels, hypothesis_template=hypothesis_template)

In [32]:
label['labels'][0]

'knowledge'

## Text Generation

In [7]:
tokenizer = AutoTokenizer.from_pretrained("deepseek-ai/DeepSeek-R1", trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained("deepseek-ai/DeepSeek-R1", trust_remote_code=True)

r1_classifier = pipeline(
    "text-generation", 
    model=model, 
    tokenizer=tokenizer,
    trust_remote_code=True
    )

messages = [
    {"role": "user", "content": "Who are you?"},
]
r1_classifier(messages)

ImportError: Loading an FP8 quantized model requires accelerate (`pip install accelerate`)

In [8]:
pip install accelerate

Note: you may need to restart the kernel to use updated packages.


# Query Augmentation