(feat) redis-semantic cache on proxy

2025-04-26 11:14:04 +00:00 · 2024-02-06 10:35:21 -08:00 · 2024-02-06 10:35:21 -08:00 · 4265c7affb
commit 4265c7affb
parent 698cee89fa
2 changed files with 5 additions and 1 deletion
--- a/litellm/proxy/proxy_server.py
+++ b/litellm/proxy/proxy_server.py
@@ -1168,7 +1168,7 @@ class ProxyConfig:
                    verbose_proxy_logger.debug(f"passed cache type={cache_type}")
-                    if cache_type == "redis":
+                    if cache_type == "redis" or cache_type == "redis-semantic":
                        cache_host = litellm.get_secret("REDIS_HOST", None)
                        cache_port = litellm.get_secret("REDIS_PORT", None)
                        cache_password = litellm.get_secret("REDIS_PASSWORD", None)
@@ -1195,6 +1195,9 @@ class ProxyConfig:
                            f"{blue_color_code}Cache Password:{reset_color_code} {cache_password}"
                        )
                        print()  # noqa
+                    if cache_type == "redis-semantic":
+                        # by default this should always be async
+                        cache_params.update({"redis_semantic_cache_use_async": True})
                    # users can pass os.environ/ variables on the proxy - we should read them from the env
                    for key, value in cache_params.items():
--- a/requirements.txt
+++ b/requirements.txt
@@ -10,6 +10,7 @@ gunicorn==21.2.0 # server dep
 boto3==1.28.58 # aws bedrock/sagemaker calls
 redis==4.6.0 # caching
 redisvl==0.0.7 # semantic caching
 numpy==1.24.3 # semantic caching
 prisma==0.11.0 # for db
 mangum==0.17.0 # for aws lambda functions
 google-generativeai==0.3.2 # for vertex ai calls