Complete 'requests' library removal (#7350)

* refactor: initial commit moving watsonx_text to base_llm_http_handler + clarifying new provider directory structure
* refactor(watsonx/completion/handler.py): move to using base llm http handler
  removes 'requests' library usage
* fix(watsonx_text/transformation.py): fix result transformation
  migrates to transformation.py, for usage with base llm http handler
* fix(streaming_handler.py): migrate watsonx streaming to transformation.py
  ensures streaming works with base llm http handler
* fix(streaming_handler.py): fix streaming linting errors and remove watsonx conditional logic
* fix(watsonx/): fix chat route post completion route refactor
* refactor(watsonx/embed): refactor watsonx to use base llm http handler for embedding calls as well
* refactor(base.py): remove requests library usage from litellm
* build(pyproject.toml): remove requests library usage
* fix: fix linting errors
* fix: fix linting errors
* fix(types/utils.py): fix validation errors for modelresponsestream
* fix(replicate/handler.py): fix linting errors
* fix(litellm_logging.py): handle modelresponsestream object
* fix(streaming_handler.py): fix modelresponsestream args
* fix: remove unused imports
* test: fix test
* fix: fix test
* test: fix test
* test: fix tests
* test: fix test
* test: fix patch target
* test: fix test
2025-04-26 03:04:13 +00:00 · 2024-12-22 07:21:25 -08:00 · 2024-12-22 07:21:25 -08:00 · 3671829e39
commit 3671829e39
parent 8b1ea40e7b
39 changed files with 2147 additions and 2279 deletions
--- a/litellm/llms/custom_httpx/llm_http_handler.py
+++ b/litellm/llms/custom_httpx/llm_http_handler.py
@@ -110,6 +110,8 @@ class BaseLLMHTTPHandler:
        api_base = provider_config.get_complete_url(
            api_base=api_base,
            model=model,
+            optional_params=optional_params,
+            stream=stream,
        )

        data = provider_config.transform_request(
@@ -402,6 +404,7 @@ class BaseLLMHTTPHandler:
        logging_obj: LiteLLMLoggingObj,
        api_base: Optional[str],
        optional_params: dict,
+        litellm_params: dict,
        model_response: EmbeddingResponse,
        api_key: Optional[str] = None,
        client: Optional[Union[HTTPHandler, AsyncHTTPHandler]] = None,
@@ -424,6 +427,7 @@ class BaseLLMHTTPHandler:
        api_base = provider_config.get_complete_url(
            api_base=api_base,
            model=model,
+            optional_params=optional_params,
        )

        data = provider_config.transform_embedding_request(
@@ -457,6 +461,8 @@ class BaseLLMHTTPHandler:
                api_key=api_key,
                timeout=timeout,
                client=client,
+                optional_params=optional_params,
+                litellm_params=litellm_params,
            )

        if client is None or not isinstance(client, HTTPHandler):
@@ -484,6 +490,8 @@ class BaseLLMHTTPHandler:
            logging_obj=logging_obj,
            api_key=api_key,
            request_data=data,
+            optional_params=optional_params,
+            litellm_params=litellm_params,
        )

    async def aembedding(
@@ -496,6 +504,8 @@ class BaseLLMHTTPHandler:
        provider_config: BaseEmbeddingConfig,
        model_response: EmbeddingResponse,
        logging_obj: LiteLLMLoggingObj,
+        optional_params: dict,
+        litellm_params: dict,
        api_key: Optional[str] = None,
        timeout: Optional[Union[float, httpx.Timeout]] = None,
        client: Optional[Union[HTTPHandler, AsyncHTTPHandler]] = None,
@@ -524,6 +534,8 @@ class BaseLLMHTTPHandler:
            logging_obj=logging_obj,
            api_key=api_key,
            request_data=request_data,
+            optional_params=optional_params,
+            litellm_params=litellm_params,
        )

    def rerank(