forked from phoenix/litellm-mirror
(feat) working semantic cache on proxy
This commit is contained in:
parent
a3b1e3bc84
commit
70a895329e
1 changed file with 6 additions and 1 deletion
|
@@ -73,7 +73,12 @@ litellm_settings:
|
||||||
max_budget: 1.5000
|
max_budget: 1.5000
|
||||||
models: ["azure-gpt-3.5"]
|
models: ["azure-gpt-3.5"]
|
||||||
duration: None
|
duration: None
|
||||||
# cache: True
|
cache: True # set cache responses to True
|
||||||
|
cache_params:
|
||||||
|
type: "redis-semantic"
|
||||||
|
similarity_threshold: 0.8
|
||||||
|
redis_semantic_cache_use_async: True
|
||||||
|
# cache: True
|
||||||
# setting callback class
|
# setting callback class
|
||||||
# callbacks: custom_callbacks.proxy_handler_instance # sets litellm.callbacks = [proxy_handler_instance]
|
# callbacks: custom_callbacks.proxy_handler_instance # sets litellm.callbacks = [proxy_handler_instance]
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue