feat(prompt_injection_detection.py): support simple heuristic similarity check for prompt injection attacks

2024-03-13 10:32:21 -07:00 · 2024-03-13 10:32:21 -07:00 · 234cdbbfef
commit 234cdbbfef
parent ac867daadc
3 changed files with 190 additions and 0 deletions
--- a/litellm/proxy/proxy_server.py
+++ b/litellm/proxy/proxy_server.py
@@ -1665,6 +1665,18 @@ class ProxyConfig:

                                banned_keywords_obj = _ENTERPRISE_BannedKeywords()
                                imported_list.append(banned_keywords_obj)
+                            elif (
+                                isinstance(callback, str)
+                                and callback == "detect_prompt_injection"
+                            ):
+                                from litellm.proxy.enterprise.enterprise_hooks.prompt_injection_detection import (
+                                    _ENTERPRISE_PromptInjectionDetection,
+                                )
+
+                                prompt_injection_detection_obj = (
+                                    _ENTERPRISE_PromptInjectionDetection()
+                                )
+                                imported_list.append(prompt_injection_detection_obj)
                            else:
                                imported_list.append(
                                    get_instance_fn(