Merge branch 'main' into inference_refactor

2025-12-18 12:39:47 +00:00 · 2024-12-16 16:47:57 -08:00 · 2024-12-16 16:47:57 -08:00 · 6a51e2268d
commit 6a51e2268d
parent 35b1a6f2dc c2f7905fa4
117 changed files with 12698 additions and 2589 deletions
--- a/llama_stack/distribution/routers/routers.py
+++ b/llama_stack/distribution/routers/routers.py
@@ -111,7 +111,7 @@ class InferenceRouter(Inference):
        model = await self.routing_table.get_model(model_id)
        if model is None:
            raise ValueError(f"Model '{model_id}' not found")
-        if model.model_type == ModelType.embedding_model:
+        if model.model_type == ModelType.embedding:
            raise ValueError(
                f"Model '{model_id}' is an embedding model and does not support chat completions"
            )
@@ -144,7 +144,7 @@ class InferenceRouter(Inference):
        model = await self.routing_table.get_model(model_id)
        if model is None:
            raise ValueError(f"Model '{model_id}' not found")
-        if model.model_type == ModelType.embedding_model:
+        if model.model_type == ModelType.embedding:
            raise ValueError(
                f"Model '{model_id}' is an embedding model and does not support chat completions"
            )