mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-18 12:39:47 +00:00
Merge branch 'main' into inference_refactor
This commit is contained in:
commit
6a51e2268d
117 changed files with 12698 additions and 2589 deletions
|
|
@ -111,7 +111,7 @@ class InferenceRouter(Inference):
|
|||
model = await self.routing_table.get_model(model_id)
|
||||
if model is None:
|
||||
raise ValueError(f"Model '{model_id}' not found")
|
||||
if model.model_type == ModelType.embedding_model:
|
||||
if model.model_type == ModelType.embedding:
|
||||
raise ValueError(
|
||||
f"Model '{model_id}' is an embedding model and does not support chat completions"
|
||||
)
|
||||
|
|
@ -144,7 +144,7 @@ class InferenceRouter(Inference):
|
|||
model = await self.routing_table.get_model(model_id)
|
||||
if model is None:
|
||||
raise ValueError(f"Model '{model_id}' not found")
|
||||
if model.model_type == ModelType.embedding_model:
|
||||
if model.model_type == ModelType.embedding:
|
||||
raise ValueError(
|
||||
f"Model '{model_id}' is an embedding model and does not support chat completions"
|
||||
)
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue