diff --git a/litellm/responses/main.py b/litellm/responses/main.py index 817389d44e..c719b993a9 100644 --- a/litellm/responses/main.py +++ b/litellm/responses/main.py @@ -15,6 +15,7 @@ from litellm.types.llms.openai import ( ResponseIncludable, ResponseInputParam, ResponsesAPIOptionalRequestParams, + ResponsesAPIResponse, ResponseTextConfigParam, ToolChoice, ToolParam, @@ -22,6 +23,8 @@ from litellm.types.llms.openai import ( from litellm.types.router import GenericLiteLLMParams from litellm.utils import ProviderConfigManager, client +from .streaming_iterator import ResponsesAPIStreamingIterator + ####### ENVIRONMENT VARIABLES ################### # Initialize any necessary instances or variables here base_llm_http_handler = BaseLLMHTTPHandler() @@ -72,7 +75,7 @@ async def aresponses( extra_body: Optional[Dict[str, Any]] = None, timeout: Optional[Union[float, httpx.Timeout]] = None, **kwargs, -): +) -> Union[ResponsesAPIResponse, ResponsesAPIStreamingIterator]: litellm_logging_obj: LiteLLMLoggingObj = kwargs.get("litellm_logging_obj") # type: ignore litellm_call_id: Optional[str] = kwargs.get("litellm_call_id", None) @@ -131,8 +134,6 @@ async def aresponses( ) return response - pass - def responses( input: Union[str, ResponseInputParam],