mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-12-31 03:50:00 +00:00
Currently, the `inspect` API for providers is really a `list` API. This change creates a new `providers` API with a GET `providers/{provider_id}` inspect endpoint
that returns "user friendly" configuration to the end user. It also adds a GET `/providers` endpoint that returns the list of providers, as `inspect/providers` does today.
The new API follows CRUD conventions and is more intuitive/RESTful.
This work is part of the RFC at #1359
Signed-off-by: Charlie Doern <cdoern@redhat.com>
59 lines
1.3 KiB
Python
59 lines
1.3 KiB
Python
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
# All rights reserved.
|
|
#
|
|
# This source code is licensed under the terms described in the LICENSE file in
|
|
# the root directory of this source tree.
|
|
|
|
from typing import List, Protocol, runtime_checkable
|
|
|
|
from pydantic import BaseModel
|
|
|
|
from llama_stack.schema_utils import json_schema_type, webmethod
|
|
|
|
|
|
# One entry of `ListRoutesResponse.data`.
# `#` comments are used instead of a class docstring so that nothing extra is
# picked up by schema generation.
@json_schema_type
class RouteInfo(BaseModel):
    # Presumably the URL path of the endpoint (compare the `route=` arguments
    # on the `Inspect` web methods) -- confirm against the implementation.
    route: str

    # Presumably the HTTP verb, e.g. "GET" -- confirm against the implementation.
    method: str

    # NOTE(review): looks like the provider types able to serve this route;
    # verify against whatever populates this model.
    provider_types: List[str]
|
|
|
|
|
|
# Payload returned by `Inspect.health` (GET /health).
# `#` comments are used instead of a class docstring so that nothing extra is
# picked up by schema generation.
@json_schema_type
class HealthInfo(BaseModel):
    # Free-form status string; the set of allowed values is not defined here.
    status: str
    # TODO: add a provider level status
|
|
|
|
|
|
# One entry of `ListProvidersResponse.data`.
# `#` comments are used instead of a class docstring so that nothing extra is
# picked up by schema generation.
@json_schema_type
class ProviderInfo(BaseModel):
    # Presumably the name of the API this provider serves -- confirm against
    # the implementation.
    api: str

    # Identifier of the provider instance (plain string; format not defined here).
    provider_id: str

    # Type/kind of the provider (plain string; format not defined here).
    provider_type: str
|
|
|
|
|
|
# Envelope returned by `Inspect.list_providers` (GET /inspect/providers).
# Unlike the item models in this module, it is not decorated with
# `@json_schema_type`; that is kept as-is.
class ListProvidersResponse(BaseModel):
    # The providers, wrapped under a single `data` key.
    data: List[ProviderInfo]
|
|
|
|
|
|
# Payload returned by `Inspect.version` (GET /version).
# `#` comments are used instead of a class docstring so that nothing extra is
# picked up by schema generation.
@json_schema_type
class VersionInfo(BaseModel):
    # Version as a plain string; its format is not constrained here.
    version: str
|
|
|
|
|
|
# Envelope returned by `Inspect.list_routes` (GET /inspect/routes).
# Unlike the item models in this module, it is not decorated with
# `@json_schema_type`; that is kept as-is.
class ListRoutesResponse(BaseModel):
    # The routes, wrapped under a single `data` key.
    data: List[RouteInfo]
|
|
|
|
|
|
# Structural interface for the inspection endpoints.
#
# `@runtime_checkable` lets callers use `isinstance(obj, Inspect)`; per the
# `typing` docs that check only verifies the methods exist, not their
# signatures. Every method is an `async` stub (`...`) bound to a GET route via
# `@webmethod`; concrete behavior lives in whatever class implements this
# protocol.
#
# `#` comments are used instead of docstrings so that no new text can leak
# into any documentation generated from these methods.
@runtime_checkable
class Inspect(Protocol):
    # GET /inspect/providers -> providers wrapped in a `ListProvidersResponse`.
    @webmethod(route="/inspect/providers", method="GET")
    async def list_providers(self) -> ListProvidersResponse:
        ...

    # GET /inspect/routes -> routes wrapped in a `ListRoutesResponse`.
    @webmethod(route="/inspect/routes", method="GET")
    async def list_routes(self) -> ListRoutesResponse:
        ...

    # GET /health -> a `HealthInfo` carrying a status string.
    @webmethod(route="/health", method="GET")
    async def health(self) -> HealthInfo:
        ...

    # GET /version -> a `VersionInfo` carrying a version string.
    @webmethod(route="/version", method="GET")
    async def version(self) -> VersionInfo:
        ...
|