fix(main.py): fix lm_studio/ embedding routing (#7658)

* fix(main.py): fix lm_studio/ embedding routing

adds the provider mapping and updates the docs with an example (see the usage sketch below)

* docs(self_serve.md): update doc to show how to auto-add sso users to teams

* fix(streaming_handler.py): simplify the async iterator check to just verify that the streaming response is an async iterable (see the sketch below)
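
For reference, a minimal usage sketch of the lm_studio/ embedding route, based on the test added in this change. It assumes an LM Studio server running locally with an OpenAI-compatible embeddings endpoint at the given base URL; this is an illustration, not the exact docs example.

import os
import litellm

# Point LiteLLM at a locally running LM Studio server (assumed address).
os.environ["LM_STUDIO_API_BASE"] = "http://localhost:8000"

# The "lm_studio/" prefix is what this fix routes to the LM Studio provider.
response = litellm.embedding(
    model="lm_studio/jina-embeddings-v3",
    input=["Hello world"],
)
print(response)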
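
And a minimal sketch of the simplified streaming check described above (not the actual streaming_handler.py code), using only the standard library's AsyncIterable ABC:

from collections.abc import AsyncIterable

async def consume_stream(response):
    # If the response supports async iteration, stream it with `async for`;
    # otherwise fall back to plain (sync) iteration.
    if isinstance(response, AsyncIterable):
        async for chunk in response:
            yield chunk
    else:
        for chunk in response:
            yield chunk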
Krish Dholakia 2025-01-09 23:03:24 -08:00 committed by GitHub
parent 14d4b695df
commit afdcbe3d64
6 changed files with 109 additions and 38 deletions


@@ -1019,6 +1019,28 @@ def test_hosted_vllm_embedding(monkeypatch):
        assert json_data["model"] == "jina-embeddings-v3"


def test_lm_studio_embedding(monkeypatch):
    monkeypatch.setenv("LM_STUDIO_API_BASE", "http://localhost:8000")
    from litellm.llms.custom_httpx.http_handler import HTTPHandler

    client = HTTPHandler()

    with patch.object(client, "post") as mock_post:
        try:
            embedding(
                model="lm_studio/jina-embeddings-v3",
                input=["Hello world"],
                client=client,
            )
        except Exception as e:
            print(e)

        mock_post.assert_called_once()

        json_data = json.loads(mock_post.call_args.kwargs["data"])
        assert json_data["input"] == ["Hello world"]
        assert json_data["model"] == "jina-embeddings-v3"


@pytest.mark.parametrize(
    "model",
    [