Add Llamafile chat config and tests

2025-04-26 03:04:13 +00:00 · 2025-04-22 16:39:33 +01:00 · 2025-04-22 16:39:33 +01:00 · 17a40696de
commit 17a40696de
parent afaa3da3dd
5 changed files with 208 additions and 1 deletion
--- a/tests/local_testing/test_embedding.py
+++ b/tests/local_testing/test_embedding.py
@ -1029,6 +1029,28 @@ def test_hosted_vllm_embedding(monkeypatch):
        assert json_data["model"] == "jina-embeddings-v3"


+def test_llamafile_embedding(monkeypatch):
+    """Check the request body sent for a ``llamafile/`` embedding call.
+
+    The HTTP client's ``post`` method is patched, and the test inspects the
+    JSON payload it was called with: the ``input`` list must be passed
+    through unchanged and the ``model`` field must be the model name
+    without the ``llamafile/`` prefix.
+    """
+    # Set the API base through the environment; monkeypatch undoes it after the test.
+    monkeypatch.setenv("LLAMAFILE_API_BASE", "http://localhost:8080/v1")
+    from litellm.llms.custom_httpx.http_handler import HTTPHandler
+
+    client = HTTPHandler()
+    with patch.object(client, "post") as mock_post:
+        # Any exception from embedding() is printed and ignored; only the
+        # outgoing request is asserted on below.
+        # NOTE(review): presumably the mocked post() result cannot be parsed
+        # as a real embedding response, which is why errors are tolerated
+        # here -- confirm.
+        try:
+            embedding(
+                model="llamafile/jina-embeddings-v3",
+                input=["Hello world"],
+                client=client,
+            )
+        except Exception as e:
+            print(e)
+
+        # Exactly one POST must have been issued through the supplied client.
+        mock_post.assert_called_once()
+
+        # The request body is read from the ``data`` keyword argument of the
+        # recorded call and decoded as JSON.
+        json_data = json.loads(mock_post.call_args.kwargs["data"])
+        assert json_data["input"] == ["Hello world"]
+        assert json_data["model"] == "jina-embeddings-v3"
+
+
@pytest.mark.asyncio
@pytest.mark.parametrize("sync_mode", [True, False])
 async def test_lm_studio_embedding(monkeypatch, sync_mode):