(refactor) caching - use _sync_set_cache (#6224)

* caching - use _sync_set_cache
* add sync _sync_add_streaming_response_to_cache
* use caching class for cache storage
2025-04-27 11:43:54 +00:00 · 2024-10-16 10:38:07 +05:30 · 2024-10-16 10:38:07 +05:30 · 4eea0652eb
commit 4eea0652eb
parent a04fc1a921
3 changed files with 89 additions and 28 deletions
--- a/litellm/litellm_core_utils/litellm_logging.py
+++ b/litellm/litellm_core_utils/litellm_logging.py
@@ -938,19 +938,6 @@ class Logging:
            else:
                callbacks = litellm.success_callback

-            ## STREAMING CACHING ##
-            if "cache" in callbacks and litellm.cache is not None:
-                # this only logs streaming once, complete_streaming_response exists i.e when stream ends
-                print_verbose("success_callback: reaches cache for logging!")
-                kwargs = self.model_call_details
-                if self.stream and _caching_complete_streaming_response is not None:
-                    print_verbose(
-                        "success_callback: reaches cache for logging, there is a complete_streaming_response. Adding to cache"
-                    )
-                    result = _caching_complete_streaming_response
-                    # only add to cache once we have a complete streaming response
-                    litellm.cache.add_cache(result, **kwargs)
-
            ## REDACT MESSAGES ##
            result = redact_message_input_output_from_logging(
                model_call_details=(