Another round of simplification and clarification for the models/shields/memory_banks code

2025-12-09 11:20:58 +00:00 · 2024-10-09 19:19:26 -07:00 · 2024-10-09 19:19:26 -07:00 · b55034c0de
commit b55034c0de
parent 73a0a34e39
27 changed files with 454 additions and 444 deletions
--- a/llama_stack/apis/inference/inference.py
+++ b/llama_stack/apis/inference/inference.py
@@ -6,7 +6,7 @@

 from enum import Enum

-from typing import List, Literal, Optional, Protocol, Union
+from typing import List, Literal, Optional, Protocol, runtime_checkable, Union

 from llama_models.schema_utils import json_schema_type, webmethod

@@ -177,6 +177,7 @@ class ModelStore(Protocol):
    def get_model(self, identifier: str) -> ModelDef: ...


+@runtime_checkable
 class Inference(Protocol):
    model_store: ModelStore

@@ -214,6 +215,3 @@ class Inference(Protocol):
        model: str,
        contents: List[InterleavedTextMedia],
    ) -> EmbeddingsResponse: ...
-
-    @webmethod(route="/inference/register_model")
-    async def register_model(self, model: ModelDef) -> None: ...