fix(custom_llm.py): support async completion calls

Krrish Dholakia 2024-07-25 15:51:39 -07:00
parent 54e1ca29b7
commit fe503386ab
3 changed files with 50 additions and 11 deletions
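
Only the test-file hunks survive in this excerpt, while the commit title names custom_llm.py, where the handler base class lives. As a rough sketch of that side of the change — assuming litellm's pattern of stub hooks that raise until a handler overrides them; the class and error names below follow that assumption rather than the verbatim source — the async support plausibly amounts to an awaitable counterpart of the sync completion hook:

# Sketch only: an `acompletion` hook on the CustomLLM base class, mirroring
# the sync `completion` hook. Names are assumed, not copied from litellm.
from typing import Any


class CustomLLMError(Exception):
    # Assumed error type raised for hooks a handler has not overridden.
    def __init__(self, status_code: int, message: str):
        self.status_code = status_code
        self.message = message
        super().__init__(self.message)


class CustomLLM:
    def completion(self, *args: Any, **kwargs: Any):
        raise CustomLLMError(status_code=500, message="Not implemented yet!")

    async def acompletion(self, *args: Any, **kwargs: Any):
        # The new async entry point: litellm.acompletion can await a
        # user-defined handler instead of falling through to the sync path.
        raise CustomLLMError(status_code=500, message="Not implemented yet!")

With that hook in place, the test file below registers an async handler and drives it through litellm.acompletion.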


@@ -23,7 +23,7 @@ import httpx
 from dotenv import load_dotenv
 
 import litellm
-from litellm import CustomLLM, completion, get_llm_provider
+from litellm import CustomLLM, acompletion, completion, get_llm_provider
 
 
 class MyCustomLLM(CustomLLM):
@@ -35,6 +35,15 @@ class MyCustomLLM(CustomLLM):
         )  # type: ignore
 
 
+class MyCustomAsyncLLM(CustomLLM):
+    async def acompletion(self, *args, **kwargs) -> litellm.ModelResponse:
+        return litellm.completion(
+            model="gpt-3.5-turbo",
+            messages=[{"role": "user", "content": "Hello world"}],
+            mock_response="Hi!",
+        )  # type: ignore
+
+
 def test_get_llm_provider():
     from litellm.utils import custom_llm_setup
@@ -61,3 +70,17 @@ def test_simple_completion():
     )
 
     assert resp.choices[0].message.content == "Hi!"
+
+
+@pytest.mark.asyncio
+async def test_simple_acompletion():
+    my_custom_llm = MyCustomAsyncLLM()
+    litellm.custom_provider_map = [
+        {"provider": "custom_llm", "custom_handler": my_custom_llm}
+    ]
+    resp = await acompletion(
+        model="custom_llm/my-fake-model",
+        messages=[{"role": "user", "content": "Hello world!"}],
+    )
+
+    assert resp.choices[0].message.content == "Hi!"
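
Outside of pytest, the new path reads like the following minimal sketch. EchoLLM and the asyncio scaffolding are invented for illustration; CustomLLM, acompletion, custom_provider_map, the custom_llm/ model prefix, and the mock_response trick come straight from the diff:

# Illustrative end-to-end run of the async path the new test exercises.
import asyncio

import litellm
from litellm import CustomLLM, acompletion


class EchoLLM(CustomLLM):
    async def acompletion(self, *args, **kwargs) -> litellm.ModelResponse:
        # Delegate to the mock-response path, as the test's handler does.
        return litellm.completion(
            model="gpt-3.5-turbo",
            messages=kwargs.get("messages", []),
            mock_response="Hi!",
        )  # type: ignore


async def main() -> None:
    # Register the handler under the "custom_llm" provider prefix, then
    # route a call to it via the model name, exactly as the test does.
    litellm.custom_provider_map = [
        {"provider": "custom_llm", "custom_handler": EchoLLM()}
    ]
    resp = await acompletion(
        model="custom_llm/my-fake-model",
        messages=[{"role": "user", "content": "Hello world!"}],
    )
    print(resp.choices[0].message.content)  # -> "Hi!"


asyncio.run(main())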