Mirror of https://github.com/BerriAI/litellm.git (synced 2025-04-26 19:24:27 +00:00)
v0 of caching
Commit 6fa2e578d4, parent 753ab03d91
4 changed files with 137 additions and 49 deletions
litellm/caching.py (new file, 81 lines)
@@ -0,0 +1,81 @@
import redis
import litellm, openai


def get_prompt(*args, **kwargs):
    # safe checks; this should not throw any exceptions
    if len(args) > 1:
        messages = args[1]
        prompt = " ".join(message["content"] for message in messages)
        return prompt
    if "messages" in kwargs:
        messages = kwargs["messages"]
        prompt = " ".join(message["content"] for message in messages)
        return prompt
    return None


class RedisCache:
    def __init__(self, host, port, password):
        # connect to the user-provided Redis instance
        self.redis_client = redis.Redis(host=host, port=port, password=password)

    def set_cache(self, key, value):
        self.redis_client.set(key, str(value))

    def get_cache(self, key):
        # TODO convert this to a ModelResponse object
        return self.redis_client.get(key)


class InMemoryCache:
    def __init__(self):
        # if users don't provide one, use the default litellm cache
        self.cache_dict = {}

    def set_cache(self, key, value):
        self.cache_dict[key] = value

    def get_cache(self, key):
        if key in self.cache_dict:
            return self.cache_dict[key]
        return None


class Cache:
    def __init__(self, type="local", host="", port="", password=""):
        if type == "redis":
            self.cache = RedisCache(host, port, password)
        if type == "local":
            self.cache = InMemoryCache()

    def check_cache(self, *args, **kwargs):
        try:  # never block execution
            prompt = get_prompt(*args, **kwargs)
            if prompt is not None:  # check if messages / prompt exists
                if "model" in kwargs:  # default to caching with `model + prompt` as key
                    cache_key = prompt + kwargs["model"]
                    return self.cache.get_cache(cache_key)
                else:
                    return self.cache.get_cache(prompt)
        except Exception:
            return None

    def add_cache(self, result, *args, **kwargs):
        try:
            prompt = get_prompt(*args, **kwargs)
            if "model" in kwargs:  # default to caching with `model + prompt` as key
                cache_key = prompt + kwargs["model"]
                self.cache.set_cache(cache_key, result)
            else:
                self.cache.set_cache(prompt, result)
        except Exception:
            pass
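
Below is a minimal usage sketch of how the Cache class above could be wired around a completion call. The `cached_completion` wrapper is a hypothetical helper, not part of this commit; it assumes the standard `litellm.completion` API and the default in-memory cache.

# Hypothetical usage sketch (not in this commit): wrap litellm.completion
# with the Cache class defined above.
import litellm
from litellm.caching import Cache

cache = Cache()  # type="local" by default; pass type="redis", host, port, password to use RedisCache


def cached_completion(model, messages, **kwargs):
    # check_cache keys on the joined message contents plus the model name
    cached = cache.check_cache(model=model, messages=messages, **kwargs)
    if cached is not None:
        return cached
    result = litellm.completion(model=model, messages=messages, **kwargs)
    cache.add_cache(result, model=model, messages=messages, **kwargs)
    return result


response = cached_completion(
    model="gpt-3.5-turbo",
    messages=[{"role": "user", "content": "Hello, how are you?"}],
)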