mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-26 11:14:04 +00:00
fix(main.py): support max retries for transcription calls
This commit is contained in:
parent
c3e4af76cf
commit
ceabf726b0
3 changed files with 7 additions and 3 deletions
|
@ -799,6 +799,7 @@ class AzureChatCompletion(BaseLLM):
|
||||||
optional_params: dict,
|
optional_params: dict,
|
||||||
model_response: TranscriptionResponse,
|
model_response: TranscriptionResponse,
|
||||||
timeout: float,
|
timeout: float,
|
||||||
|
max_retries: int,
|
||||||
api_key: Optional[str] = None,
|
api_key: Optional[str] = None,
|
||||||
api_base: Optional[str] = None,
|
api_base: Optional[str] = None,
|
||||||
api_version: Optional[str] = None,
|
api_version: Optional[str] = None,
|
||||||
|
@ -817,8 +818,6 @@ class AzureChatCompletion(BaseLLM):
|
||||||
"timeout": timeout,
|
"timeout": timeout,
|
||||||
}
|
}
|
||||||
|
|
||||||
max_retries = optional_params.pop("max_retries", None)
|
|
||||||
|
|
||||||
azure_client_params = select_azure_base_url_or_endpoint(
|
azure_client_params = select_azure_base_url_or_endpoint(
|
||||||
azure_client_params=azure_client_params
|
azure_client_params=azure_client_params
|
||||||
)
|
)
|
||||||
|
|
|
@ -785,10 +785,10 @@ class OpenAIChatCompletion(BaseLLM):
|
||||||
optional_params: dict,
|
optional_params: dict,
|
||||||
model_response: TranscriptionResponse,
|
model_response: TranscriptionResponse,
|
||||||
timeout: float,
|
timeout: float,
|
||||||
|
max_retries: int,
|
||||||
api_key: Optional[str] = None,
|
api_key: Optional[str] = None,
|
||||||
api_base: Optional[str] = None,
|
api_base: Optional[str] = None,
|
||||||
client=None,
|
client=None,
|
||||||
max_retries=None,
|
|
||||||
logging_obj=None,
|
logging_obj=None,
|
||||||
atranscription: bool = False,
|
atranscription: bool = False,
|
||||||
):
|
):
|
||||||
|
|
|
@ -3553,6 +3553,7 @@ def transcription(
|
||||||
api_key: Optional[str] = None,
|
api_key: Optional[str] = None,
|
||||||
api_base: Optional[str] = None,
|
api_base: Optional[str] = None,
|
||||||
api_version: Optional[str] = None,
|
api_version: Optional[str] = None,
|
||||||
|
max_retries: Optional[int] = None,
|
||||||
litellm_logging_obj=None,
|
litellm_logging_obj=None,
|
||||||
custom_llm_provider=None,
|
custom_llm_provider=None,
|
||||||
**kwargs,
|
**kwargs,
|
||||||
|
@ -3568,6 +3569,8 @@ def transcription(
|
||||||
proxy_server_request = kwargs.get("proxy_server_request", None)
|
proxy_server_request = kwargs.get("proxy_server_request", None)
|
||||||
model_info = kwargs.get("model_info", None)
|
model_info = kwargs.get("model_info", None)
|
||||||
metadata = kwargs.get("metadata", {})
|
metadata = kwargs.get("metadata", {})
|
||||||
|
if max_retries is None:
|
||||||
|
max_retries = openai.DEFAULT_MAX_RETRIES
|
||||||
|
|
||||||
model_response = litellm.utils.TranscriptionResponse()
|
model_response = litellm.utils.TranscriptionResponse()
|
||||||
|
|
||||||
|
@ -3611,6 +3614,7 @@ def transcription(
|
||||||
api_key=api_key,
|
api_key=api_key,
|
||||||
api_version=api_version,
|
api_version=api_version,
|
||||||
azure_ad_token=azure_ad_token,
|
azure_ad_token=azure_ad_token,
|
||||||
|
max_retries=max_retries,
|
||||||
)
|
)
|
||||||
elif custom_llm_provider == "openai":
|
elif custom_llm_provider == "openai":
|
||||||
response = openai_chat_completions.audio_transcriptions(
|
response = openai_chat_completions.audio_transcriptions(
|
||||||
|
@ -3621,6 +3625,7 @@ def transcription(
|
||||||
atranscription=atranscription,
|
atranscription=atranscription,
|
||||||
timeout=timeout,
|
timeout=timeout,
|
||||||
logging_obj=litellm_logging_obj,
|
logging_obj=litellm_logging_obj,
|
||||||
|
max_retries=max_retries,
|
||||||
)
|
)
|
||||||
return response
|
return response
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue