Make all API methods async def again

2025-12-13 04:22:35 +00:00 · 2024-10-18 16:50:57 -07:00 · 2024-10-18 16:50:57 -07:00 · 627edaf407
commit 627edaf407
parent 95a96afe34
17 changed files with 120 additions and 145 deletions
--- a/llama_stack/apis/inference/inference.py
+++ b/llama_stack/apis/inference/inference.py
@@ -181,10 +181,8 @@ class ModelStore(Protocol):
 class Inference(Protocol):
    model_store: ModelStore

-    # This method is not `async def` because it can result in either an
-    # `AsyncGenerator` or a `CompletionResponse` depending on the value of `stream`.
    @webmethod(route="/inference/completion")
-    def completion(
+    async def completion(
        self,
        model: str,
        content: InterleavedTextMedia,
@@ -196,7 +194,7 @@ class Inference(Protocol):
    # This method is not `async def` because it can result in either an
    # `AsyncGenerator` or a `ChatCompletionResponse` depending on the value of `stream`.
    @webmethod(route="/inference/chat_completion")
-    def chat_completion(
+    async def chat_completion(
        self,
        model: str,
        messages: List[Message],