diff --git a/litellm/cost_calculator.py b/litellm/cost_calculator.py index 1d10fa1f9e..b83fe09305 100644 --- a/litellm/cost_calculator.py +++ b/litellm/cost_calculator.py @@ -573,9 +573,7 @@ def completion_cost( # noqa: PLR0915 base_model=base_model, ) - verbose_logger.debug( - f"completion_response _select_model_name_for_cost_calc: {model}" - ) + verbose_logger.info(f"selected model name for cost calculation: {model}") if completion_response is not None and ( isinstance(completion_response, BaseModel) diff --git a/litellm/llms/azure/audio_transcriptions.py b/litellm/llms/azure/audio_transcriptions.py index 94793295ca..ba9ac01400 100644 --- a/litellm/llms/azure/audio_transcriptions.py +++ b/litellm/llms/azure/audio_transcriptions.py @@ -7,7 +7,11 @@ from pydantic import BaseModel import litellm from litellm.litellm_core_utils.audio_utils.utils import get_audio_file_name from litellm.types.utils import FileTypes -from litellm.utils import TranscriptionResponse, convert_to_model_response_object +from litellm.utils import ( + TranscriptionResponse, + convert_to_model_response_object, + extract_duration_from_srt_or_vtt, +) from .azure import ( AzureChatCompletion, @@ -156,6 +160,8 @@ class AzureAudioTranscription(AzureChatCompletion): stringified_response = response.model_dump() else: stringified_response = TranscriptionResponse(text=response).model_dump() + duration = extract_duration_from_srt_or_vtt(response) + stringified_response["duration"] = duration ## LOGGING logging_obj.post_call( diff --git a/litellm/proxy/_experimental/out/onboarding.html b/litellm/proxy/_experimental/out/onboarding.html deleted file mode 100644 index ef020510ab..0000000000 --- a/litellm/proxy/_experimental/out/onboarding.html +++ /dev/null @@ -1 +0,0 @@ -