Mirror of https://github.com/meta-llama/llama-stack.git, synced 2025-12-12 12:06:04 +00:00
fix batch embeddings
parent e6428492e6, commit bbdde4ec12

1 changed file with 4 additions and 1 deletion
@@ -25,6 +25,7 @@ from llama_stack.apis.inference import (
     OpenAIChatCompletionRequestWithExtraBody,
     OpenAICompletionRequestWithExtraBody,
     OpenAIDeveloperMessageParam,
+    OpenAIEmbeddingsRequestWithExtraBody,
     OpenAIMessageParam,
     OpenAISystemMessageParam,
     OpenAIToolMessageParam,
@@ -640,7 +641,9 @@ class ReferenceBatchesImpl(Batches):
                 },
             }
         else:  # /v1/embeddings
-            embeddings_response = await self.inference_api.openai_embeddings(**request.body)
+            embeddings_response = await self.inference_api.openai_embeddings(
+                OpenAIEmbeddingsRequestWithExtraBody(**request.body)
+            )
             assert hasattr(embeddings_response, "model_dump_json"), (
                 "Embeddings response must have model_dump_json method"
             )
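The change is small: the batch processor previously splatted the stored request body directly into `openai_embeddings(**request.body)`; it now validates the body into the typed `OpenAIEmbeddingsRequestWithExtraBody` model and passes that single object, presumably matching the pattern suggested by the `OpenAIChatCompletionRequestWithExtraBody` and `OpenAICompletionRequestWithExtraBody` imports already present in the same module. Below is a minimal sketch of the resulting call pattern, not the provider's actual code; the helper function, the `body` dict, and the assumption that the request model accepts the standard OpenAI embeddings fields (`model`, `input`) are all illustrative.

```python
# Sketch only: shows the wrapped-request call pattern from this commit.
# run_embeddings_item and example_body are hypothetical; the real values come
# from the stored batch item (request.body).
from llama_stack.apis.inference import OpenAIEmbeddingsRequestWithExtraBody


async def run_embeddings_item(inference_api, body: dict):
    # Old call: await inference_api.openai_embeddings(**body)
    # New call: build a typed request object from the body, then pass it as a
    # single argument to the inference API.
    embeddings_request = OpenAIEmbeddingsRequestWithExtraBody(**body)
    return await inference_api.openai_embeddings(embeddings_request)


# Hypothetical batch item body, assuming OpenAI-style embeddings fields.
example_body = {"model": "some-embedding-model", "input": ["hello", "world"]}
```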