fix(azure.py): fix error handling for openai/azure streaming

2025-04-26 03:04:13 +00:00 · 2023-11-29 11:52:24 -08:00 · 2023-11-29 11:52:24 -08:00 · a9ed768991
commit a9ed768991
parent b6bc75e27a
4 changed files with 32 additions and 8 deletions
--- a/litellm/llms/azure.py
+++ b/litellm/llms/azure.py
@@ -221,7 +221,7 @@ class AzureChatCompletion(BaseLLM):
                  timeout: Any,
                  azure_ad_token: Optional[str]=None, 
                  client=None,
-    ):
+    ): 
        max_retries = data.pop("max_retries", 2)
        if not isinstance(max_retries, int): 
            raise AzureOpenAIError(status_code=422, message="max retries must be an int")
@@ -244,8 +244,7 @@ class AzureChatCompletion(BaseLLM):
            azure_client = client
        response = azure_client.chat.completions.create(**data)
        streamwrapper = CustomStreamWrapper(completion_stream=response, model=model, custom_llm_provider="azure",logging_obj=logging_obj)
-        for transformed_chunk in streamwrapper:
-            yield transformed_chunk
+        return streamwrapper

    async def async_streaming(self, 
                          logging_obj,