forked from phoenix/litellm-mirror
(feat) add cache context manager
parent 231148ed73
commit ddddfe6602
2 changed files with 58 additions and 0 deletions
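For orientation, a minimal usage sketch of the two helpers this commit adds, enable_cache() and disable_cache() (full diff below); the model name and message are illustrative placeholders, not part of the commit:

# Sketch of the intended usage, based on the functions added below.
# The model and messages are placeholders.
import litellm
from litellm.caching import enable_cache, disable_cache

enable_cache(type="local")  # registers the "cache" callbacks and sets litellm.cache

# Identical repeated calls can now be answered from the cache.
response = litellm.completion(
    model="gpt-3.5-turbo",
    messages=[{"role": "user", "content": "Hello"}],
)

disable_cache()  # removes the callbacks and resets litellm.cache to None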
@@ -220,6 +220,7 @@ class Cache:
         if "cache" not in litellm._async_success_callback:
             litellm._async_success_callback.append("cache")
         self.supported_call_types = supported_call_types  # default to ["completion", "acompletion", "embedding", "aembedding"]
+        self.type = type
 
     def get_cache_key(self, *args, **kwargs):
         """
@@ -374,3 +375,59 @@ class Cache:
 
     async def _async_add_cache(self, result, *args, **kwargs):
         self.add_cache(result, *args, **kwargs)
+
+
+def enable_cache(
+    type: Optional[Literal["local", "redis"]] = "local",
+    host: Optional[str] = None,
+    port: Optional[str] = None,
+    password: Optional[str] = None,
+    supported_call_types: Optional[
+        List[Literal["completion", "acompletion", "embedding", "aembedding"]]
+    ] = ["completion", "acompletion", "embedding", "aembedding"],
+    **kwargs,
+):
+    """
+    Enable caching.
+
+    :param attach_cache: If True, attach the cache to litellm.cache
+    :return: None
+    """
+    print_verbose("LiteLLM: Enabling Cache")
+    if "cache" not in litellm.input_callback:
+        litellm.input_callback.append("cache")
+    if "cache" not in litellm.success_callback:
+        litellm.success_callback.append("cache")
+    if "cache" not in litellm._async_success_callback:
+        litellm._async_success_callback.append("cache")
+
+    if litellm.cache == None:
+        litellm.cache = Cache(
+            type=type,
+            host=host,
+            port=port,
+            password=password,
+            supported_call_types=supported_call_types,
+            **kwargs,
+        )
+    print_verbose(f"LiteLLM: Cache enabled, litellm.cache={litellm.cache}")
+    print_verbose(f"LiteLLM Cache: {vars(litellm.cache)}")
+
+
+def disable_cache():
+    from contextlib import suppress
+
+    """
+    Disable caching.
+
+    :param detach_cache: If True, detach the cache from litellm.cache
+    :return: None
+    """
+    print_verbose("LiteLLM: Disabling Cache")
+    with suppress(ValueError):
+        litellm.input_callback.remove("cache")
+        litellm.success_callback.remove("cache")
+        litellm._async_success_callback.remove("cache")
+
+    litellm.cache = None
+    print_verbose(f"LiteLLM: Cache disabled, litellm.cache={litellm.cache}")
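Two notes on the hunk above. disable_cache() wraps the remove() calls in contextlib.suppress(ValueError): list.remove raises ValueError when the element is absent, so suppressing it makes disabling idempotent even if caching was never enabled. And since enable_cache() forwards its arguments to the Cache constructor, the Redis backend is configured through the same helper; a sketch with placeholder connection details:

# Sketch: enabling the Redis backend through the new helper. Host, port
# and password are placeholders; note the signature types port as a str.
from litellm.caching import enable_cache

enable_cache(
    type="redis",
    host="127.0.0.1",
    port="6379",
    password="changeme",  # placeholder credential
    supported_call_types=["completion", "acompletion"],
)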
@@ -71,6 +71,7 @@ from .llms.prompt_templates.factory import (
 import tiktoken
 from concurrent.futures import ThreadPoolExecutor
 from typing import Callable, List, Optional, Dict, Union, Mapping
+from .caching import enable_cache, disable_cache
 
 encoding = tiktoken.get_encoding("cl100k_base")
 from litellm.utils import (
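The last hunk, in the second changed file, places the import beside that module's other top-level imports. Assuming that module is star-imported by the package __init__ (an assumption, not shown in this diff), the helpers also become reachable from the package namespace:

# Assumes a package-level re-export; if that assumption fails, import the
# helpers from litellm.caching directly.
import litellm

litellm.enable_cache()
# ... cached completion calls ...
litellm.disable_cache()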