fix(huggingface_restapi.py): fixes issue where 'wait_for_model' was not being passed as expected

2024-08-09 08:35:36 -07:00 · 2024-08-09 08:35:36 -07:00 · 51ccfa9e77
commit 51ccfa9e77
parent a1c3167853
3 changed files with 64 additions and 3 deletions
--- a/litellm/llms/huggingface_restapi.py
+++ b/litellm/llms/huggingface_restapi.py
@ -838,7 +838,12 @@ class Huggingface(BaseLLM):
        return {"inputs": input}  # default to feature-extraction pipeline tag
    async def _async_transform_input(
-        self, model: str, task_type: Optional[str], embed_url: str, input: List
+        self,
        model: str,
        task_type: Optional[str],
        embed_url: str,
        input: List,
        optional_params: dict,
    ) -> dict:
        hf_task = await async_get_hf_task_embedding_for_model(
            model=model, task_type=task_type, api_base=embed_url
@ -846,6 +851,9 @@ class Huggingface(BaseLLM):
        data = self._transform_input_on_pipeline_tag(input=input, pipeline_tag=hf_task)
        if len(optional_params.keys()) > 0:
            data["options"] = optional_params
        return data
    def _transform_input(
@ -856,6 +864,7 @@ class Huggingface(BaseLLM):
        optional_params: dict,
        embed_url: str,
    ) -> dict:
        data: Dict = {}
        ## TRANSFORMATION ##
        if "sentence-transformers" in model:
            if len(input) == 0:
@ -865,7 +874,7 @@ class Huggingface(BaseLLM):
                )
            data = {"inputs": {"source_sentence": input[0], "sentences": input[1:]}}
        else:
-            data = {"inputs": input}  # type: ignore
+            data = {"inputs": input}
            task_type = optional_params.pop("input_type", None)
@ -882,6 +891,9 @@ class Huggingface(BaseLLM):
                input=input, pipeline_tag=hf_task
            )
        if len(optional_params.keys()) > 0:
            data["options"] = optional_params
        return data
    def _process_embedding_response(
--- a/litellm/tests/test_embedding.py
+++ b/litellm/tests/test_embedding.py
@ -1,3 +1,4 @@
 import json
 import os
 import sys
 import traceback
@ -11,7 +12,7 @@ load_dotenv()
 sys.path.insert(
    0, os.path.abspath("../..")
 )  # Adds the parent directory to the system path
-from unittest.mock import MagicMock, patch
+from unittest.mock import AsyncMock, MagicMock, patch
 import litellm
 from litellm import completion, completion_cost, embedding
@ -740,3 +741,43 @@ async def test_databricks_embeddings(sync_mode):
 #     print(response)
 # local_proxy_embeddings()
@pytest.mark.parametrize("sync_mode", [True, False])
@pytest.mark.asyncio
 async def test_hf_embedddings_with_optional_params(sync_mode):
    litellm.set_verbose = True
    if sync_mode:
        client = HTTPHandler(concurrent_limit=1)
        mock_obj = MagicMock()
    else:
        client = AsyncHTTPHandler(concurrent_limit=1)
        mock_obj = AsyncMock()
    with patch.object(client, "post", new=mock_obj) as mock_client:
        try:
            if sync_mode:
                response = embedding(
                    model="huggingface/jinaai/jina-embeddings-v2-small-en",
                    input=["good morning from litellm"],
                    wait_for_model=True,
                    client=client,
                )
            else:
                response = await litellm.aembedding(
                    model="huggingface/jinaai/jina-embeddings-v2-small-en",
                    input=["good morning from litellm"],
                    wait_for_model=True,
                    client=client,
                )
        except Exception:
            pass
        mock_client.assert_called_once()
        print(f"mock_client.call_args.kwargs: {mock_client.call_args.kwargs}")
        assert "options" in mock_client.call_args.kwargs["data"]
        json_data = json.loads(mock_client.call_args.kwargs["data"])
        assert "wait_for_model" in json_data["options"]
        assert json_data["options"]["wait_for_model"] is True
--- a/litellm/tests/test_optional_params.py
+++ b/litellm/tests/test_optional_params.py
@ -438,3 +438,11 @@ def test_get_optional_params_image_gen():
    print(response)
    assert "aws_region_name" in response
 def test_bedrock_optional_params_embeddings_provider_specific_params():
    optional_params = get_optional_params_embeddings(
        custom_llm_provider="huggingface",
        wait_for_model=True,
    )
    assert len(optional_params) == 1