Merge pull request #2203 from BerriAI/litellm_streaming_caching_fix

fix(utils.py): support returning a cached streaming response for function-calling streaming calls
Krish Dholakia 2024-02-26 19:58:00 -08:00 committed by GitHub
commit 95b5b7f1fc
5 changed files with 168 additions and 64 deletions


@@ -3677,6 +3677,7 @@ def stream_chunk_builder(
        response["usage"]["total_tokens"] = (
            response["usage"]["prompt_tokens"] + response["usage"]["completion_tokens"]
        )
        return convert_to_model_response_object(
            response_object=response,
            model_response_object=model_response,
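
For context, litellm exposes stream_chunk_builder as a public helper that reassembles streamed chunks into a single response (including the usage totals computed above), which is what gets written to the cache. Below is a minimal sketch of the flow this fix targets: a function-calling call streamed once, rebuilt, then requested again so it can be served from cache. The model name, the get_current_weather tool, and the in-memory cache choice are assumptions for illustration, not taken from this PR.

# Sketch only: get_current_weather and the model choice are hypothetical.
import litellm
from litellm import completion, stream_chunk_builder
from litellm.caching import Cache

litellm.cache = Cache()  # default in-memory cache for this sketch

tools = [
    {
        "type": "function",
        "function": {
            "name": "get_current_weather",  # hypothetical tool
            "description": "Get the current weather for a city",
            "parameters": {
                "type": "object",
                "properties": {"city": {"type": "string"}},
                "required": ["city"],
            },
        },
    }
]
messages = [{"role": "user", "content": "What's the weather in Boston?"}]

# First call streams from the provider; collecting the chunks lets the
# rebuilt response (with prompt/completion/total token counts) be cached.
chunks = list(
    completion(
        model="gpt-3.5-turbo",
        messages=messages,
        tools=tools,
        stream=True,
        caching=True,
    )
)
rebuilt = stream_chunk_builder(chunks, messages=messages)
print(rebuilt.usage)  # total_tokens = prompt_tokens + completion_tokens

# An identical second call should now be served from the cache as a
# streaming response, which previously broke for function-calling streams.
cached_chunks = list(
    completion(
        model="gpt-3.5-turbo",
        messages=messages,
        tools=tools,
        stream=True,
        caching=True,
    )
)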