# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.

from typing import Any, Dict, List, Optional, Protocol

from llama_models.llama3.api.datatypes import Model
from llama_models.schema_utils import json_schema_type, webmethod
from llama_stack.distribution.datatypes import GenericProviderConfig
from pydantic import BaseModel, Field


# Describes one served model: the llama model metadata, the provider
# configuration used to serve it, and the API it is served under.
@json_schema_type
class ModelServingSpec(BaseModel):
    llama_model: Model = Field(
        description="All metadatas associated with llama model (defined in llama_models.models.sku_list).",
    )
    provider_config: GenericProviderConfig = Field(
        description="Provider config for the model, including provider_id, and corresponding config. ",
    )
    # Falls back to "inference" when the caller does not supply a value.
    api: str = Field(
        description="The API that this model is serving (e.g. inference / safety).",
        default="inference",
    )


# Response payload for Models.list_models: a list of serving specs.
@json_schema_type
class ModelsListResponse(BaseModel):
    models_list: List[ModelServingSpec]


# Response payload for Models.get_model.
# NOTE(review): core_model_spec defaults to None; presumably it stays None
# when no model matches the requested id -- confirm against implementations.
@json_schema_type
class ModelsGetResponse(BaseModel):
    core_model_spec: Optional[ModelServingSpec] = None


# Structural interface for the models API. Both methods are declared as
# stubs (`...`); concrete behaviour lives in whatever class satisfies this
# protocol.
class Models(Protocol):
    # Registered as GET /models/list; takes no arguments besides self.
    @webmethod(route="/models/list", method="GET")
    async def list_models(self) -> ModelsListResponse: ...

    # Registered as POST /models/get; takes the id of the model to look up.
    @webmethod(route="/models/get", method="POST")
    async def get_model(self, core_model_id: str) -> ModelsGetResponse: ...