diff --git a/litellm/llms/azure.py b/litellm/llms/azure.py index 01b54987b2..6a0c1ec1fb 100644 --- a/litellm/llms/azure.py +++ b/litellm/llms/azure.py @@ -333,10 +333,17 @@ class AzureChatCompletion(BaseLLM): azure_client_params["api_key"] = api_key elif azure_ad_token is not None: azure_client_params["azure_ad_token"] = azure_ad_token + + # setting Azure client if client is None: azure_client = AsyncAzureOpenAI(**azure_client_params) else: azure_client = client + if api_version is not None and isinstance( + azure_client._custom_query, dict + ): + # set api_version to version passed by user + azure_client._custom_query.setdefault("api-version", api_version) ## LOGGING logging_obj.pre_call( input=data["messages"],