Skip to content

Commit

Permalink
Merge pull request #37 from jannikstdl/prompt_injection_filter
Browse files Browse the repository at this point in the history
  • Loading branch information
tjbck committed Jun 5, 2024
2 parents b4ed391 + 0bc42e8 commit ac14bf6
Showing 1 changed file with 81 additions and 0 deletions.
81 changes: 81 additions & 0 deletions examples/filters/llmguard_prompt_injection_filter_pipeline.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,81 @@
"""
title: LLM Guard Filter Pipeline
author: jannikstdl
date: 2024-05-30
version: 1.0
license: MIT
description: A pipeline for filtering out potential prompt injections using the LLM Guard library.
requirements: llm-guard
"""

from typing import List, Optional
from schemas import OpenAIChatMessage
from pydantic import BaseModel
from llm_guard.input_scanners import PromptInjection
from llm_guard.input_scanners.prompt_injection import MatchType
import os

class Pipeline:
    """Open WebUI filter pipeline that rejects prompts flagged as prompt injections.

    The newest message of every incoming chat request is scanned with LLM
    Guard's ``PromptInjection`` scanner.  When the scanner reports the text as
    invalid the request is aborted by raising an exception; otherwise the
    request body is passed through unchanged.
    """

    # Detection threshold handed to the scanner.  It is kept in one place so
    # that the scanner configuration is the single source of truth for what
    # counts as an injection.
    INJECTION_THRESHOLD = 0.8

    def __init__(self):
        # Pipeline filters are only compatible with Open WebUI.
        # A filter pipeline acts as middleware that can edit the form data
        # before it is sent to the OpenAI API.
        self.type = "filter"

        # Unique identifier of the pipeline.  It must be unique across all
        # pipelines and may only contain alphanumerics, underscores or hyphens
        # (no spaces, special characters, slashes or backslashes).
        self.id = "llmguard_prompt_injection_filter_pipeline"
        self.name = "LLMGuard Prompt Injection Filter"

        class Valves(BaseModel):
            # Target pipeline ids (models) this filter is connected to,
            # e.g. ["llama3:latest", "gpt-3.5-turbo"]; ["*"] means all.
            pipelines: List[str] = []

            # Execution order among filter pipelines: the lower the number,
            # the higher the priority.
            priority: int = 0

        # Connect to all pipelines by default.
        self.valves = Valves(pipelines=["*"])

        # The scanner is created in on_startup (or lazily on first use)
        # rather than in the constructor.
        self.model = None

    def _build_scanner(self):
        """Create the LLM Guard prompt-injection scanner used by this filter."""
        return PromptInjection(
            threshold=self.INJECTION_THRESHOLD, match_type=MatchType.FULL
        )

    @staticmethod
    def _extract_text(content):
        """Return the plain text of a chat message's ``content`` field.

        ``content`` is either a string or, for OpenAI-style multi-part
        messages, a list of parts where text parts look like
        ``{"type": "text", "text": "..."}``.  Non-text parts are ignored.
        Anything else (e.g. ``None``) yields an empty string.
        """
        if isinstance(content, str):
            return content
        if isinstance(content, list):
            texts = [
                part["text"]
                for part in content
                if isinstance(part, dict)
                and part.get("type") == "text"
                and isinstance(part.get("text"), str)
            ]
            return "\n".join(texts)
        return ""

    async def on_startup(self):
        """Called when the server is started; creates the scanner."""
        print(f"on_startup:{__name__}")
        self.model = self._build_scanner()

    async def on_shutdown(self):
        """Called when the server is stopped."""
        print(f"on_shutdown:{__name__}")

    async def on_valves_updated(self):
        """Called when the valves are updated; nothing to refresh here."""

    async def inlet(self, body: dict, user: Optional[dict] = None) -> dict:
        """Scan the newest message of ``body`` before it reaches the model.

        Args:
            body: The chat-completion form data; its ``"messages"`` list is
                inspected and the last entry's ``"content"`` is scanned.
            user: Optional information about the requesting user (unused).

        Returns:
            The same ``body`` object, unmodified, when nothing was flagged or
            when there is no text to scan.

        Raises:
            Exception: With the message ``"Prompt injection detected"`` when
                the scanner reports the message as invalid.
        """
        print(f"inlet:{__name__}")

        messages = body.get("messages") or []
        if not messages:
            # Nothing to scan; let the request through untouched.
            return body

        text = self._extract_text(messages[-1].get("content"))
        if not text:
            return body

        if self.model is None:
            # on_startup has not run (yet); build the scanner on demand
            # instead of failing with an AttributeError on None.
            self.model = self._build_scanner()

        # scan() returns (sanitized_prompt, is_valid, risk_score).  Rely on
        # is_valid, which already reflects the scanner's configured threshold.
        # NOTE(review): risk_score may be on a different scale than the
        # threshold depending on the llm-guard version - confirm before
        # comparing it against INJECTION_THRESHOLD again.
        _, is_valid, _ = self.model.scan(text)

        if not is_valid:
            raise Exception("Prompt injection detected")

        return body

0 comments on commit ac14bf6

Please sign in to comment.