# 🛡️ Simple Guardrail Demo with HuggingFace LLM (No API Key Needed)
This notebook allows you to:
- Block prompts containing bad words (guardrail)
- Send clean prompts to a HuggingFace LLM that is downloaded and run locally with `transformers`
- Log and display the results


In [ ]:
!pip install transformers accelerate

In [ ]:
import re

# Words that cause a prompt to be rejected. Matched as whole words,
# case-insensitively, by is_blocked() below.
blocked_words = ["kill", "bomb", "steal"]


def is_blocked(prompt):
    """Return True if *prompt* contains any entry of ``blocked_words``.

    Matching is case-insensitive and restricted to whole words, so "kill"
    blocks "Kill the process" but not "skill". The pattern is rebuilt on
    every call so later edits to ``blocked_words`` take effect immediately.

    Args:
        prompt: The user-supplied prompt text.

    Returns:
        bool: True when at least one blocked word is present, else False.
    """
    if not blocked_words:
        # An empty alternation would match at any word boundary and
        # therefore block almost every prompt.
        return False
    # r"\b" (single backslash) is the regex word-boundary assertion.
    # r"\\b" would instead match a literal backslash followed by "b",
    # which never occurs in normal prompts and disables the guardrail.
    pattern = r"\b(?:" + "|".join(re.escape(word) for word in blocked_words) + r")\b"
    return re.search(pattern, prompt, re.IGNORECASE) is not None

In [ ]:
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline

# Checkpoint identifier passed to both from_pretrained() calls below.
model_name = "tiiuae/falcon-7b-instruct"

# Tokenizer and model are loaded from the same checkpoint name.
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(
    model_name,
    device_map="auto",
    # NOTE(review): this allows code shipped with the checkpoint to run
    # locally; keep it only for checkpoints you trust.
    trust_remote_code=True,
)

# Text-generation pipeline built from the model and tokenizer loaded above.
generator = pipeline(
    task="text-generation",
    model=model,
    tokenizer=tokenizer,
)

In [ ]:
# Read one prompt interactively from the user.
prompt = input("Enter your prompt: ")

# Run the guardrail check first; only prompts that pass are sent to the model.
if not is_blocked(prompt):
    # The pipeline returns a list of dicts; take the text of the first result.
    output = generator(prompt, max_new_tokens=100)[0]["generated_text"]
    print("✅ Output:", output)
else:
    print("❌ Prompt blocked by guardrail!")