Tests pass with Ollama now

2025-12-18 19:39:47 +00:00 · 2024-12-15 17:31:21 -08:00 · 2024-12-15 17:31:21 -08:00 · e51154964f
commit e51154964f
parent a9a041a1de
27 changed files with 83 additions and 65 deletions
--- a/llama_stack/apis/batch_inference/batch_inference.py
+++ b/llama_stack/apis/batch_inference/batch_inference.py
@@ -17,7 +17,7 @@ from llama_stack.apis.inference import *  # noqa: F403
@json_schema_type
 class BatchCompletionRequest(BaseModel):
    model: str
-    content_batch: List[InterleavedTextMedia]
+    content_batch: List[InterleavedContent]
    sampling_params: Optional[SamplingParams] = SamplingParams()
    logprobs: Optional[LogProbConfig] = None

@@ -53,7 +53,7 @@ class BatchInference(Protocol):
    async def batch_completion(
        self,
        model: str,
-        content_batch: List[InterleavedTextMedia],
+        content_batch: List[InterleavedContent],
        sampling_params: Optional[SamplingParams] = SamplingParams(),
        logprobs: Optional[LogProbConfig] = None,
    ) -> BatchCompletionResponse: ...