feat(prompt_injection_detection.py): support simple heuristic similarity check for prompt injection attacks

This commit is contained in:
Krrish Dholakia 2024-03-13 10:32:21 -07:00
parent ac867daadc
commit 234cdbbfef
3 changed files with 190 additions and 0 deletions

View file

@@ -1665,6 +1665,18 @@ class ProxyConfig:
banned_keywords_obj = _ENTERPRISE_BannedKeywords()
imported_list.append(banned_keywords_obj)
elif (
isinstance(callback, str)
and callback == "detect_prompt_injection"
):
from litellm.proxy.enterprise.enterprise_hooks.prompt_injection_detection import (
_ENTERPRISE_PromptInjectionDetection,
)
prompt_injection_detection_obj = (
_ENTERPRISE_PromptInjectionDetection()
)
imported_list.append(prompt_injection_detection_obj)
else:
imported_list.append(
get_instance_fn(