From 2bf20ebfdf252bf6195b922b2fa165de7319326f Mon Sep 17 00:00:00 2001 From: Ishaan Jaff Date: Sat, 4 Jan 2025 20:18:32 -0800 Subject: [PATCH] latency fix proxy (#7563) --- litellm/proxy/litellm_pre_call_utils.py | 17 ++++++++++------- 1 file changed, 10 insertions(+), 7 deletions(-) diff --git a/litellm/proxy/litellm_pre_call_utils.py b/litellm/proxy/litellm_pre_call_utils.py index 6cd7dca743..ad7371e84d 100644 --- a/litellm/proxy/litellm_pre_call_utils.py +++ b/litellm/proxy/litellm_pre_call_utils.py @@ -1,3 +1,4 @@ +import asyncio import copy import time from typing import TYPE_CHECKING, Any, Dict, Optional, Union @@ -616,13 +617,15 @@ async def add_litellm_data_to_request( # noqa: PLR0915 ) end_time = time.time() - await service_logger_obj.async_service_success_hook( - service=ServiceTypes.PROXY_PRE_CALL, - duration=end_time - start_time, - call_type="add_litellm_data_to_request", - start_time=start_time, - end_time=end_time, - parent_otel_span=user_api_key_dict.parent_otel_span, + asyncio.create_task( + service_logger_obj.async_service_success_hook( + service=ServiceTypes.PROXY_PRE_CALL, + duration=end_time - start_time, + call_type="add_litellm_data_to_request", + start_time=start_time, + end_time=end_time, + parent_otel_span=user_api_key_dict.parent_otel_span, + ) ) return data