# Tiny A11y LoRA Chatbot
This notebook loads the `younglim/tiny-a11y-model` LoRA adapter on top of the `deepseek-ai/deepseek-coder-1.3b-instruct` base model and lets you chat with it interactively through a Gradio interface.

In [None]:
# Install required packages
!pip install --upgrade pip
!pip install transformers accelerate peft gradio

In [None]:
# Load base model and tokenizer
from transformers import AutoTokenizer, AutoModelForCausalLM
from peft import PeftModelForCausalLM

# Hub identifiers: the base checkpoint and the LoRA adapter applied on top of it
base_model_name = 'deepseek-ai/deepseek-coder-1.3b-instruct'
lora_model_name = 'younglim/tiny-a11y-model'

# Base causal LM, plus the tokenizer published under the same identifier
base_model = AutoModelForCausalLM.from_pretrained(base_model_name)
tokenizer = AutoTokenizer.from_pretrained(base_model_name)

# Wrap the base model with the adapter; `model` is the object the chat cell calls
model = PeftModelForCausalLM.from_pretrained(
    model=base_model,
    model_id=lora_model_name,
)

In [None]:
# Chat function using PyTorch generate
def chat(prompt, max_new_tokens=300):
    """Generate a sampled reply to ``prompt`` from the LoRA-adapted model.

    Uses the notebook-level ``tokenizer`` and ``model`` objects.

    Args:
        prompt: Text sent to the model as-is (no chat template is applied).
        max_new_tokens: Upper bound on the number of tokens to generate.

    Returns:
        The decoded text of the newly generated tokens only, with special
        tokens removed. The prompt itself is not repeated in the result.
    """
    # Keep the encoded prompt on the same device as the model so generation
    # still works if the model has been moved off the CPU.
    inputs = tokenizer(prompt, return_tensors='pt').to(model.device)
    prompt_length = inputs['input_ids'].shape[1]

    outputs = model.generate(
        **inputs,
        max_new_tokens=max_new_tokens,
        do_sample=True,
        temperature=0.7,
        top_p=0.9,
    )

    # For a causal LM, generate() returns the prompt tokens followed by the
    # new tokens; drop the prompt part so only the model's reply is decoded.
    reply_ids = outputs[0][prompt_length:]
    return tokenizer.decode(reply_ids, skip_special_tokens=True)

In [None]:
# Launch Gradio interface
import gradio as gr

# Input and output widgets for the chat UI
prompt_box = gr.Textbox(lines=5, label='Enter your prompt')
response_box = gr.Textbox(lines=15, label='Model response')

# Wire the `chat` function between the two text boxes
iface = gr.Interface(
    fn=chat,
    inputs=prompt_box,
    outputs=response_box,
    title='Tiny A11y Chatbot',
    description='Ask the Tiny A11y Model anything about accessibility.',
)

# share=True requests a public link in addition to the local one
iface.launch(share=True)