litellm/litellm/caching.py
2023-08-28 14:13:03 -07:00

90 lines
2.6 KiB
Python

import litellm, openai
def get_prompt(*args, **kwargs):
    """Build a single prompt string from a chat-style ``messages`` list.

    The messages are taken from the second positional argument when at
    least two positional arguments are given, otherwise from the
    ``messages`` keyword argument.

    Returns:
        The ``"content"`` values of all messages joined by single spaces,
        or ``None`` when no messages were supplied or when they cannot be
        turned into a prompt (not iterable, an entry without a
        ``"content"`` key, or content that is not a string).

    This function is used while computing cache keys, so it must never
    raise: a malformed request simply yields ``None``.
    """
    if len(args) > 1:
        messages = args[1]
    elif "messages" in kwargs:
        messages = kwargs["messages"]
    else:
        return None

    try:
        return " ".join(message["content"] for message in messages)
    except (TypeError, KeyError, IndexError):
        # TypeError: messages/message is not iterable/subscriptable, or a
        #            content value is not a string (e.g. None).
        # KeyError:  a message dict has no "content" entry.
        # IndexError: a message is a sequence rather than a mapping.
        return None
class RedisCache():
    """Cache backend that stores values in a Redis server."""

    def __init__(self, host, port, password):
        """Create the Redis client used for all reads and writes.

        Args:
            host: Redis server host, forwarded to ``redis.Redis``.
            port: Redis server port, forwarded to ``redis.Redis``.
            password: Redis password, forwarded to ``redis.Redis``.
        """
        # Imported here instead of in the class body: a class-level import
        # only creates a class attribute, which is not visible as a bare
        # name inside methods, so ``redis.Redis`` raised NameError. A local
        # import also keeps the module importable when redis is not
        # installed and only the in-memory cache is used.
        import redis

        # if users don't provide one, use the default litellm cache
        self.redis_client = redis.Redis(host=host, port=port, password=password)

    def set_cache(self, key, value):
        """Store ``str(value)`` under ``key``."""
        self.redis_client.set(key, str(value))

    def get_cache(self, key):
        """Return whatever the Redis client holds for ``key``.

        The value is returned exactly as the client provides it (the
        stringified form written by ``set_cache``), not the original object.
        """
        # TODO convert this to a ModelResponse object
        return self.redis_client.get(key)
class InMemoryCache():
    """Process-local cache that keeps every entry in a plain dictionary."""

    def __init__(self):
        # This is the default litellm cache, used when users don't provide one.
        self.cache_dict = dict()

    def get_cache(self, key):
        """Return the value stored under ``key``, or ``None`` on a miss."""
        return self.cache_dict.get(key, None)

    def set_cache(self, key, value):
        """Store ``value`` under ``key``, replacing any previous entry."""
        self.cache_dict[key] = value
class Cache():
    """Front end that routes cache reads and writes to a concrete backend.

    Cache keys are derived from the call arguments: the prompt text (or the
    ``input`` keyword) followed by the model name. Reads and writes are
    best-effort and never raise, so a cache problem cannot block the call
    being cached.
    """

    def __init__(self, type="local", host="", port="", password=""):
        """Select the cache backend.

        Args:
            type: ``"redis"`` for a ``RedisCache`` or ``"local"`` (default)
                for an ``InMemoryCache``. The name shadows the builtin but is
                kept because callers may pass it by keyword.
            host: Redis host; only used when ``type == "redis"``.
            port: Redis port; only used when ``type == "redis"``.
            password: Redis password; only used when ``type == "redis"``.
        """
        # Any other ``type`` leaves the cache without a backend: lookups
        # then miss and writes are dropped, instead of failing on a missing
        # attribute.
        self.cache = None
        if type == "redis":
            # RedisCache.__init__ takes (host, port, password); passing
            # ``type`` as an extra first argument raised TypeError.
            self.cache = RedisCache(host, port, password)
        elif type == "local":
            self.cache = InMemoryCache()

    def get_cache_key(self, *args, **kwargs):
        """Return the cache key for a call, or ``None`` if it is not cacheable.

        The key is the prompt built by ``get_prompt`` or, failing that, the
        space-joined ``input`` keyword, with the model name appended.
        """
        prompt = get_prompt(*args, **kwargs)
        if prompt is not None:
            cache_key = prompt
        elif "input" in kwargs:
            cache_key = " ".join(kwargs["input"])
        else:
            return None

        if "model" in kwargs:
            cache_key += kwargs["model"]
        elif args and isinstance(args[0], str):
            # Assumes the first positional argument is the model name,
            # mirroring get_prompt's use of the second positional argument
            # as the messages. Without this, calls that pass the model
            # positionally would share cache entries across models.
            cache_key += args[0]
        return cache_key

    def get_cache(self, *args, **kwargs):
        """Return the cached result for this call, or ``None`` on a miss or error."""
        try:  # never block execution
            cache_key = self.get_cache_key(*args, **kwargs)
            if cache_key is None or self.cache is None:
                return None
            return self.cache.get_cache(cache_key)
        except Exception:
            # Deliberately best-effort; ``Exception`` (not a bare except)
            # so KeyboardInterrupt/SystemExit still propagate.
            return None

    def add_cache(self, result, *args, **kwargs):
        """Store ``result`` for this call; silently does nothing on error."""
        try:
            cache_key = self.get_cache_key(*args, **kwargs)
            if cache_key is not None and self.cache is not None:
                self.cache.set_cache(cache_key, result)
        except Exception:
            # Deliberately best-effort: a failed write must not break the
            # caller, but interpreter-exit signals are not swallowed.
            pass