mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-24 00:47:00 +00:00
**This PR changes configurations in a backward incompatible way.** Run configs today repeat full SQLite/Postgres snippets everywhere a store is needed, which means duplicated credentials, extra connection pools, and lots of drift between files. This PR introduces named storage backends so the stack and providers can share a single catalog and reference those backends by name. ## Key Changes - Add `storage.backends` to `StackRunConfig`, register each KV/SQL backend once at startup, and validate that references point to the right family. - Move server stores under `storage.stores` with lightweight references (backend + namespace/table) instead of full configs. - Update every provider/config/doc to use the new reference style; docs/codegen now surface the simplified YAML. ## Migration Before: ```yaml metadata_store: type: sqlite db_path: ~/.llama/distributions/foo/registry.db inference_store: type: postgres host: ${env.POSTGRES_HOST} port: ${env.POSTGRES_PORT} db: ${env.POSTGRES_DB} user: ${env.POSTGRES_USER} password: ${env.POSTGRES_PASSWORD} conversations_store: type: postgres host: ${env.POSTGRES_HOST} port: ${env.POSTGRES_PORT} db: ${env.POSTGRES_DB} user: ${env.POSTGRES_USER} password: ${env.POSTGRES_PASSWORD} ``` After: ```yaml storage: backends: kv_default: type: kv_sqlite db_path: ~/.llama/distributions/foo/kvstore.db sql_default: type: sql_postgres host: ${env.POSTGRES_HOST} port: ${env.POSTGRES_PORT} db: ${env.POSTGRES_DB} user: ${env.POSTGRES_USER} password: ${env.POSTGRES_PASSWORD} stores: metadata: backend: kv_default namespace: registry inference: backend: sql_default table_name: inference_store max_write_queue_size: 10000 num_writers: 4 conversations: backend: sql_default table_name: openai_conversations ``` Provider configs follow the same pattern—for example, a Chroma vector adapter switches from: ```yaml providers: vector_io: - provider_id: chromadb provider_type: remote::chromadb config: url: ${env.CHROMADB_URL} kvstore: type: sqlite db_path: 
~/.llama/distributions/foo/chroma.db ``` to: ```yaml providers: vector_io: - provider_id: chromadb provider_type: remote::chromadb config: url: ${env.CHROMADB_URL} persistence: backend: kv_default namespace: vector_io::chroma_remote ``` Once the backends are declared, everything else just points at them, so rotating credentials or swapping to Postgres happens in one place and the stack reuses a single connection pool.
309 lines
12 KiB
Python
309 lines
12 KiB
Python
# Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
# All rights reserved.
|
|
#
|
|
# This source code is licensed under the terms described in the LICENSE file in
|
|
# the root directory of this source tree.
|
|
|
|
import secrets
|
|
import time
|
|
from typing import Any
|
|
|
|
from openai import NOT_GIVEN
|
|
from pydantic import BaseModel, TypeAdapter
|
|
|
|
from llama_stack.apis.conversations.conversations import (
|
|
Conversation,
|
|
ConversationDeletedResource,
|
|
ConversationItem,
|
|
ConversationItemDeletedResource,
|
|
ConversationItemList,
|
|
Conversations,
|
|
Metadata,
|
|
)
|
|
from llama_stack.core.datatypes import AccessRule, StackRunConfig
|
|
from llama_stack.log import get_logger
|
|
from llama_stack.providers.utils.sqlstore.api import ColumnDefinition, ColumnType
|
|
from llama_stack.providers.utils.sqlstore.authorized_sqlstore import AuthorizedSqlStore
|
|
from llama_stack.providers.utils.sqlstore.sqlstore import sqlstore_impl
|
|
|
|
logger = get_logger(name=__name__, category="openai_conversations")
|
|
|
|
|
|
class ConversationServiceConfig(BaseModel):
    """Settings consumed by the built-in conversation service.

    :param run_config: Stack run configuration; the service reads its conversations store reference from it
    :param policy: Access control rules applied to the service's SQL store
    """

    # Full stack run config, consulted for storage.stores.conversations.
    run_config: StackRunConfig
    # Access rules; an empty list (the default) means no rules are configured.
    policy: list[AccessRule] = []
|
|
|
|
|
|
async def get_provider_impl(config: ConversationServiceConfig, deps: dict[Any, Any]):
    """Build the conversation service and initialize it before handing it back.

    :param config: Conversation service configuration
    :param deps: Dependencies passed through to the service constructor
    :returns: The initialized ConversationServiceImpl instance
    """
    service = ConversationServiceImpl(config, deps)
    await service.initialize()
    return service
|
|
|
|
|
|
class ConversationServiceImpl(Conversations):
    """Built-in conversation service implementation using AuthorizedSqlStore.

    Conversations are stored in the ``openai_conversations`` table and their
    items in the ``conversation_items`` table. Every store call goes through an
    ``AuthorizedSqlStore`` constructed with the configured policy.
    """

    def __init__(self, config: ConversationServiceConfig, deps: dict[Any, Any]):
        """Wire up the SQL store from the run config.

        :param config: Service configuration (run config and access policy)
        :param deps: Dependencies; stored on the instance as-is
        :raises ValueError: If ``storage.stores.conversations`` is not configured
        """
        self.config = config
        self.deps = deps
        self.policy = config.policy

        # Use conversations store reference from run config
        conversations_ref = config.run_config.storage.stores.conversations
        if not conversations_ref:
            raise ValueError("storage.stores.conversations must be configured in run config")

        base_sql_store = sqlstore_impl(conversations_ref)
        self.sql_store = AuthorizedSqlStore(base_sql_store, self.policy)

        # Build the item validator once; it is reused by add_items, retrieve and list
        # instead of being reconstructed on every call.
        self._item_adapter: TypeAdapter[ConversationItem] = TypeAdapter(ConversationItem)

    async def initialize(self) -> None:
        """Initialize the store and create tables."""
        await self.sql_store.create_table(
            "openai_conversations",
            {
                "id": ColumnDefinition(type=ColumnType.STRING, primary_key=True),
                "created_at": ColumnType.INTEGER,
                "items": ColumnType.JSON,
                "metadata": ColumnType.JSON,
            },
        )

        await self.sql_store.create_table(
            "conversation_items",
            {
                "id": ColumnDefinition(type=ColumnType.STRING, primary_key=True),
                "conversation_id": ColumnType.STRING,
                "created_at": ColumnType.INTEGER,
                "item_data": ColumnType.JSON,
            },
        )

    def _build_item_record(self, conversation_id: str, item: ConversationItem, created_at: int) -> dict[str, Any]:
        """Build the ``conversation_items`` row for one item.

        The dumped item is stored under ``item_data``; if the item had no ID, the
        generated one is written into that dump as well.
        """
        item_dict = item.model_dump()
        item_id = self._get_or_generate_item_id(item, item_dict)
        return {
            "id": item_id,
            "conversation_id": conversation_id,
            "created_at": created_at,
            "item_data": item_dict,
        }

    async def create_conversation(
        self, items: list[ConversationItem] | None = None, metadata: Metadata | None = None
    ) -> Conversation:
        """Create a conversation.

        :param items: Optional initial items to store with the conversation
        :param metadata: Optional metadata stored on the conversation record
        :returns: The newly created conversation
        """
        random_bytes = secrets.token_bytes(24)
        conversation_id = f"conv_{random_bytes.hex()}"
        created_at = int(time.time())

        record_data = {
            "id": conversation_id,
            "created_at": created_at,
            "items": [],
            "metadata": metadata,
        }

        await self.sql_store.insert(
            table="openai_conversations",
            data=record_data,
        )

        if items:
            # Offset each timestamp by the item's position, as add_items does, so that
            # listing (which sorts on created_at) preserves the submitted order.
            item_records = [
                self._build_item_record(conversation_id, item, created_at + offset)
                for offset, item in enumerate(items)
            ]
            await self.sql_store.insert(table="conversation_items", data=item_records)

        conversation = Conversation(
            id=conversation_id,
            created_at=created_at,
            metadata=metadata,
            object="conversation",
        )

        logger.debug(f"Created conversation {conversation_id}")
        return conversation

    async def get_conversation(self, conversation_id: str) -> Conversation:
        """Get a conversation with the given ID.

        :param conversation_id: ID of the conversation to fetch
        :returns: The stored conversation
        :raises ValueError: If no conversation with that ID is found
        """
        record = await self.sql_store.fetch_one(table="openai_conversations", where={"id": conversation_id})

        if record is None:
            raise ValueError(f"Conversation {conversation_id} not found")

        return Conversation(
            id=record["id"], created_at=record["created_at"], metadata=record.get("metadata"), object="conversation"
        )

    async def update_conversation(self, conversation_id: str, metadata: Metadata) -> Conversation:
        """Update a conversation's metadata with the given ID.

        :param conversation_id: ID of the conversation to update
        :param metadata: New metadata value for the conversation
        :returns: The conversation as re-read from the store after the update
        :raises ValueError: If the conversation is not found when re-read
        """
        await self.sql_store.update(
            table="openai_conversations", data={"metadata": metadata}, where={"id": conversation_id}
        )

        return await self.get_conversation(conversation_id)

    async def openai_delete_conversation(self, conversation_id: str) -> ConversationDeletedResource:
        """Delete a conversation with the given ID.

        Only the row in ``openai_conversations`` is removed; rows in
        ``conversation_items`` are not touched by this method.

        :param conversation_id: ID of the conversation to delete
        :returns: A deletion resource carrying the conversation ID
        """
        await self.sql_store.delete(table="openai_conversations", where={"id": conversation_id})

        logger.debug(f"Deleted conversation {conversation_id}")
        return ConversationDeletedResource(id=conversation_id)

    def _validate_conversation_id(self, conversation_id: str) -> None:
        """Validate conversation ID format.

        :raises ValueError: If the ID does not begin with ``conv_``
        """
        if not conversation_id.startswith("conv_"):
            raise ValueError(
                f"Invalid 'conversation_id': '{conversation_id}'. Expected an ID that begins with 'conv_'."
            )

    def _get_or_generate_item_id(self, item: ConversationItem, item_dict: dict) -> str:
        """Get existing item ID or generate one if missing.

        When an ID is generated it is also written to ``item_dict["id"]`` so the
        stored payload carries it.
        """
        if item.id is not None:
            return item.id

        # Message items get a "msg_" prefix; every other item type gets "item_".
        prefix = "msg" if item.type == "message" else "item"
        item_id = f"{prefix}_{secrets.token_bytes(24).hex()}"
        item_dict["id"] = item_id
        return item_id

    async def _get_validated_conversation(self, conversation_id: str) -> Conversation:
        """Validate conversation ID and return the conversation if it exists."""
        self._validate_conversation_id(conversation_id)
        return await self.get_conversation(conversation_id)

    async def add_items(self, conversation_id: str, items: list[ConversationItem]) -> ConversationItemList:
        """Create (add) items to a conversation.

        :param conversation_id: ID of an existing conversation (must begin with ``conv_``)
        :param items: Items to store, in order
        :returns: The stored items; ``has_more`` is always False
        :raises ValueError: If the ID is malformed or the conversation is not found
        """
        await self._get_validated_conversation(conversation_id)

        created_items = []
        base_time = int(time.time())

        for i, item in enumerate(items):
            # make each timestamp unique to maintain order
            item_record = self._build_item_record(conversation_id, item, base_time + i)
            item_id = item_record["id"]
            item_dict = item_record["item_data"]

            # TODO: Add support for upsert in sql_store, this will fail first if ID exists and then update
            try:
                await self.sql_store.insert(table="conversation_items", data=item_record)
            except Exception:
                # Any insert failure is treated as an ID conflict and retried as an update.
                # Log it so a different underlying cause is not lost silently.
                # NOTE(review): the update matches on item ID only, not on conversation_id.
                logger.debug(f"Insert of item {item_id} failed, updating existing record instead", exc_info=True)
                await self.sql_store.update(
                    table="conversation_items",
                    data={"created_at": item_record["created_at"], "item_data": item_dict},
                    where={"id": item_id},
                )

            created_items.append(item_dict)

        logger.debug(f"Created {len(created_items)} items in conversation {conversation_id}")

        # Convert created items (dicts) to proper ConversationItem types
        response_items = [self._item_adapter.validate_python(item_dict) for item_dict in created_items]

        return ConversationItemList(
            data=response_items,
            first_id=created_items[0]["id"] if created_items else None,
            last_id=created_items[-1]["id"] if created_items else None,
            has_more=False,
        )

    async def retrieve(self, conversation_id: str, item_id: str) -> ConversationItem:
        """Retrieve a conversation item.

        :param conversation_id: ID of the conversation the item belongs to
        :param item_id: ID of the item to fetch
        :returns: The stored item, validated as a ConversationItem
        :raises ValueError: If either ID is empty or the item is not found in the conversation
        """
        if not conversation_id:
            raise ValueError(f"Expected a non-empty value for `conversation_id` but received {conversation_id!r}")
        if not item_id:
            raise ValueError(f"Expected a non-empty value for `item_id` but received {item_id!r}")

        # Get item from conversation_items table
        record = await self.sql_store.fetch_one(
            table="conversation_items", where={"id": item_id, "conversation_id": conversation_id}
        )

        if record is None:
            raise ValueError(f"Item {item_id} not found in conversation {conversation_id}")

        return self._item_adapter.validate_python(record["item_data"])

    async def list(self, conversation_id: str, after=NOT_GIVEN, include=NOT_GIVEN, limit=NOT_GIVEN, order=NOT_GIVEN):
        """List items in the conversation.

        :param conversation_id: ID of the conversation whose items are listed
        :param after: Item ID cursor; when a non-empty string, only items that follow it
            in the requested order are returned
        :param include: Accepted for interface compatibility; not used by this implementation
        :param limit: Maximum number of items to return (default 20); must be at least 1
        :param order: "asc" sorts by creation time ascending; anything else sorts descending
        :returns: A ConversationItemList whose ``has_more`` is True when items remain past this page
        :raises ValueError: If ``conversation_id`` is empty, the conversation is not found,
            ``limit`` is below 1, or ``after`` does not name an item of the conversation
        """
        if not conversation_id:
            raise ValueError(f"Expected a non-empty value for `conversation_id` but received {conversation_id!r}")

        # check if conversation exists
        await self.get_conversation(conversation_id)

        result = await self.sql_store.fetch_all(table="conversation_items", where={"conversation_id": conversation_id})
        records = sorted(result.data, key=lambda record: record["created_at"], reverse=order != "asc")

        # Honor the pagination cursor: skip everything up to and including the `after` item.
        if isinstance(after, str) and after:
            for index, record in enumerate(records):
                if record["id"] == after:
                    records = records[index + 1 :]
                    break
            else:
                raise ValueError(f"Item {after} not found in conversation {conversation_id}")

        page_size = 20
        if isinstance(limit, int):
            # A negative limit would slice from the wrong end, and a zero limit would
            # report more data without yielding a cursor to fetch it.
            if limit < 1:
                raise ValueError(f"Expected a positive value for `limit` but received {limit!r}")
            page_size = limit

        has_more = len(records) > page_size
        page = records[:page_size]

        response_items = [self._item_adapter.validate_python(record["item_data"]) for record in page]

        first_id = response_items[0].id if response_items else None
        last_id = response_items[-1].id if response_items else None

        return ConversationItemList(
            data=response_items,
            first_id=first_id,
            last_id=last_id,
            has_more=has_more,
        )

    async def openai_delete_conversation_item(
        self, conversation_id: str, item_id: str
    ) -> ConversationItemDeletedResource:
        """Delete a conversation item.

        :param conversation_id: ID of the conversation the item belongs to (must begin with ``conv_``)
        :param item_id: ID of the item to delete
        :returns: A deletion resource carrying the item ID
        :raises ValueError: If either ID is empty, the conversation ID is malformed,
            or the conversation or item is not found
        """
        if not conversation_id:
            raise ValueError(f"Expected a non-empty value for `conversation_id` but received {conversation_id!r}")
        if not item_id:
            raise ValueError(f"Expected a non-empty value for `item_id` but received {item_id!r}")

        await self._get_validated_conversation(conversation_id)

        item_filter = {"id": item_id, "conversation_id": conversation_id}

        # Look the item up first so a missing item is reported rather than silently ignored.
        record = await self.sql_store.fetch_one(table="conversation_items", where=item_filter)

        if record is None:
            raise ValueError(f"Item {item_id} not found in conversation {conversation_id}")

        await self.sql_store.delete(table="conversation_items", where=item_filter)

        logger.debug(f"Deleted item {item_id} from conversation {conversation_id}")
        return ConversationItemDeletedResource(id=item_id)
|