diff --git a/llama_toolchain/inference/api/api.py b/llama_toolchain/inference/api/api.py index 712b25b2b..2bf225be4 100644 --- a/llama_toolchain/inference/api/api.py +++ b/llama_toolchain/inference/api/api.py @@ -170,7 +170,7 @@ class Inference(Protocol): @webmethod(route="/inference/completion") async def completion( self, - model: str + model: str, content: InterleavedTextMedia, sampling_params: Optional[SamplingParams] = SamplingParams(), stream: Optional[bool] = False,