### Testing Model

In [1]:
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
def load_model_and_tokenizer(model_path="customer_support_model"):
    """Load a causal language model and its tokenizer onto the best available device.

    Args:
        model_path: Path or identifier handed to ``from_pretrained`` for both
            the tokenizer and the model. Defaults to
            ``"customer_support_model"``.

    Returns:
        A ``(model, tokenizer, device)`` tuple, where ``model`` has already
        been moved to ``device``.
    """
    # Prefer a CUDA GPU, then Apple's MPS backend, and fall back to the CPU.
    if torch.cuda.is_available():
        device = torch.device("cuda")
    elif torch.backends.mps.is_available():
        device = torch.device("mps")
    else:
        device = torch.device("cpu")

    tokenizer = AutoTokenizer.from_pretrained(model_path)
    model = AutoModelForCausalLM.from_pretrained(model_path).to(device)
    return model, tokenizer, device

In [3]:
def test_model(model, tokenizer, device, test_cases=None):
    if test_cases is None:
        test_cases = [
            "How do I cancel my order?",
            "I need help with my purchase",
            "I can't afford this order",
            "What's my order status?",
            "Can you help me with a refund?"
        ]
    
    results = []
    for prompt in test_cases:
        inputs = tokenizer(
            f"### User: {prompt}",
            return_tensors="pt",
            truncation=True,
            max_length=256
        ).to(device)
        
        outputs = model.generate(
            **inputs,
            max_new_tokens=128,
            temperature=0.7,
            do_sample=True,
            top_p=0.95,
            repetition_penalty=1.2
        )
        
        response = tokenizer.decode(outputs[0], skip_special_tokens=True)
        results.append({"prompt": prompt, "response": response})
        
        print(f"\nTest Case: {prompt}")
        print(f"Response: {response}")
        print("-" * 50)
    
    return results

In [None]:
# Load the fine-tuned model, its tokenizer, and the device the model lives on
model, tokenizer, device = load_model_and_tokenizer()

# test_model samples its replies (do_sample=True), so seed torch's RNG first
# to make the printed responses repeatable across Restart & Run All.
torch.manual_seed(42)

# Run the built-in test prompts and keep the prompt/response pairs
results = test_model(model, tokenizer, device)

  Referenced from: <0B7EB158-53DC-3403-8A49-22178CAB4612> /Users/koyiljonvaliev/Anaconda/anaconda3/envs/llm_env/lib/python3.10/site-packages/torchvision/image.so
  warn(
  warn("The installed version of bitsandbytes was compiled without GPU support. "


'NoneType' object has no attribute 'cadam32bit_grad_fp32'


Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
