Merge branch 'main' into add-mcp-authentication-param

2025-12-04 10:10:36 +00:00 · 2025-11-13 13:49:06 -08:00 · 2025-11-13 13:49:06 -08:00 · 949756ebb8
commit 949756ebb8
parent b090ed2e46 a82b79ce57
2 changed files with 46 additions and 1 deletions
--- a/src/llama_stack/core/routers/vector_io.py
+++ b/src/llama_stack/core/routers/vector_io.py
@@ -14,7 +14,9 @@ from llama_stack_api import (
    HealthResponse,
    HealthStatus,
    InterleavedContent,
+    ModelNotFoundError,
    ModelType,
+    ModelTypeError,
    OpenAICreateVectorStoreFileBatchRequestWithExtraBody,
    OpenAICreateVectorStoreRequestWithExtraBody,
    QueryChunksResponse,
@@ -124,6 +126,14 @@ class VectorIORouter(VectorIO):
        if embedding_model is not None and embedding_dimension is None:
            embedding_dimension = await self._get_embedding_model_dimension(embedding_model)

+        # Validate that embedding model exists and is of the correct type
+        if embedding_model is not None:
+            model = await self.routing_table.get_object_by_identifier("model", embedding_model)
+            if model is None:
+                raise ModelNotFoundError(embedding_model)
+            if model.model_type != ModelType.embedding:
+                raise ModelTypeError(embedding_model, model.model_type, ModelType.embedding)
+
        # Auto-select provider if not specified
        if provider_id is None:
            num_providers = len(self.routing_table.impls_by_provider_id)