mirror of
				https://github.com/meta-llama/llama-stack.git
				synced 2025-10-26 17:23:00 +00:00 
			
		
		
		
	**This PR changes configurations in a backward incompatible way.**
Run configs today repeat full SQLite/Postgres snippets everywhere a
store is needed, which means duplicated credentials, extra connection
pools, and lots of drift between files. This PR introduces named storage
backends so the stack and providers can share a single catalog and
reference those backends by name.
## Key Changes
- Add `storage.backends` to `StackRunConfig`, register each KV/SQL
backend once at startup, and validate that references point to the right
family.
- Move server stores under `storage.stores` with lightweight references
(backend + namespace/table) instead of full configs.
- Update every provider/config/doc to use the new reference style;
docs/codegen now surface the simplified YAML.
## Migration
Before:
```yaml
metadata_store:
  type: sqlite
  db_path: ~/.llama/distributions/foo/registry.db
inference_store:
  type: postgres
  host: ${env.POSTGRES_HOST}
  port: ${env.POSTGRES_PORT}
  db: ${env.POSTGRES_DB}
  user: ${env.POSTGRES_USER}
  password: ${env.POSTGRES_PASSWORD}
conversations_store:
  type: postgres
  host: ${env.POSTGRES_HOST}
  port: ${env.POSTGRES_PORT}
  db: ${env.POSTGRES_DB}
  user: ${env.POSTGRES_USER}
  password: ${env.POSTGRES_PASSWORD}
```
After:
```yaml
storage:
  backends:
    kv_default:
      type: kv_sqlite
      db_path: ~/.llama/distributions/foo/kvstore.db
    sql_default:
      type: sql_postgres
      host: ${env.POSTGRES_HOST}
      port: ${env.POSTGRES_PORT}
      db: ${env.POSTGRES_DB}
      user: ${env.POSTGRES_USER}
      password: ${env.POSTGRES_PASSWORD}
  stores:
    metadata:
      backend: kv_default
      namespace: registry
    inference:
      backend: sql_default
      table_name: inference_store
      max_write_queue_size: 10000
      num_writers: 4
    conversations:
      backend: sql_default
      table_name: openai_conversations
```
Provider configs follow the same pattern—for example, a Chroma vector
adapter switches from:
```yaml
providers:
  vector_io:
  - provider_id: chromadb
    provider_type: remote::chromadb
    config:
      url: ${env.CHROMADB_URL}
      kvstore:
        type: sqlite
        db_path: ~/.llama/distributions/foo/chroma.db
```
to:
```yaml
providers:
  vector_io:
  - provider_id: chromadb
    provider_type: remote::chromadb
    config:
      url: ${env.CHROMADB_URL}
      persistence:
        backend: kv_default
        namespace: vector_io::chroma_remote
```
Once the backends are declared, everything else just points at them, so
rotating credentials or swapping to Postgres happens in one place and
the stack reuses a single connection pool.
		
	
			
		
			
				
	
	
		
			212 lines
		
	
	
	
		
			7.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			212 lines
		
	
	
	
		
			7.5 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # Copyright (c) Meta Platforms, Inc. and affiliates.
 | |
| # All rights reserved.
 | |
| #
 | |
| # This source code is licensed under the terms described in the LICENSE file in
 | |
| # the root directory of this source tree.
 | |
| import textwrap
 | |
| from typing import Any
 | |
| 
 | |
| from llama_stack.core.datatypes import (
 | |
|     LLAMA_STACK_RUN_CONFIG_VERSION,
 | |
|     DistributionSpec,
 | |
|     Provider,
 | |
|     StackRunConfig,
 | |
| )
 | |
| from llama_stack.core.distribution import (
 | |
|     builtin_automatically_routed_apis,
 | |
|     get_provider_registry,
 | |
| )
 | |
| from llama_stack.core.stack import cast_image_name_to_string, replace_env_vars
 | |
| from llama_stack.core.utils.config_dirs import EXTERNAL_PROVIDERS_DIR
 | |
| from llama_stack.core.utils.dynamic import instantiate_class_type
 | |
| from llama_stack.core.utils.prompt_for_config import prompt_for_config
 | |
| from llama_stack.log import get_logger
 | |
| from llama_stack.providers.datatypes import Api, ProviderSpec
 | |
| 
 | |
| logger = get_logger(name=__name__, category="core")
 | |
| 
 | |
| 
 | |
| def configure_single_provider(registry: dict[str, ProviderSpec], provider: Provider) -> Provider:
 | |
|     provider_spec = registry[provider.provider_type]
 | |
|     config_type = instantiate_class_type(provider_spec.config_class)
 | |
|     try:
 | |
|         if provider.config:
 | |
|             existing = config_type(**provider.config)
 | |
|         else:
 | |
|             existing = None
 | |
|     except Exception:
 | |
|         existing = None
 | |
| 
 | |
|     cfg = prompt_for_config(config_type, existing)
 | |
|     return Provider(
 | |
|         provider_id=provider.provider_id,
 | |
|         provider_type=provider.provider_type,
 | |
|         config=cfg.model_dump(),
 | |
|     )
 | |
| 
 | |
| 
 | |
| def configure_api_providers(config: StackRunConfig, build_spec: DistributionSpec) -> StackRunConfig:
 | |
|     is_nux = len(config.providers) == 0
 | |
| 
 | |
|     if is_nux:
 | |
|         logger.info(
 | |
|             textwrap.dedent(
 | |
|                 """
 | |
|         Llama Stack is composed of several APIs working together. For each API served by the Stack,
 | |
|         we need to configure the providers (implementations) you want to use for these APIs.
 | |
| """
 | |
|             )
 | |
|         )
 | |
| 
 | |
|     provider_registry = get_provider_registry()
 | |
|     builtin_apis = [a.routing_table_api for a in builtin_automatically_routed_apis()]
 | |
| 
 | |
|     if config.apis:
 | |
|         apis_to_serve = config.apis
 | |
|     else:
 | |
|         apis_to_serve = [a.value for a in Api if a not in (Api.inspect, Api.providers)]
 | |
| 
 | |
|     for api_str in apis_to_serve:
 | |
|         api = Api(api_str)
 | |
|         if api in builtin_apis:
 | |
|             continue
 | |
|         if api not in provider_registry:
 | |
|             raise ValueError(f"Unknown API `{api_str}`")
 | |
| 
 | |
|         existing_providers = config.providers.get(api_str, [])
 | |
|         if existing_providers:
 | |
|             logger.info(f"Re-configuring existing providers for API `{api_str}`...")
 | |
|             updated_providers = []
 | |
|             for p in existing_providers:
 | |
|                 logger.info(f"> Configuring provider `({p.provider_type})`")
 | |
|                 updated_providers.append(configure_single_provider(provider_registry[api], p))
 | |
|                 logger.info("")
 | |
|         else:
 | |
|             # we are newly configuring this API
 | |
|             plist = build_spec.providers.get(api_str, [])
 | |
|             plist = plist if isinstance(plist, list) else [plist]
 | |
| 
 | |
|             if not plist:
 | |
|                 raise ValueError(f"No provider configured for API {api_str}?")
 | |
| 
 | |
|             logger.info(f"Configuring API `{api_str}`...")
 | |
|             updated_providers = []
 | |
|             for i, provider in enumerate(plist):
 | |
|                 if i >= 1:
 | |
|                     others = ", ".join(p.provider_type for p in plist[i:])
 | |
|                     logger.info(
 | |
|                         f"Not configuring other providers ({others}) interactively. Please edit the resulting YAML directly.\n"
 | |
|                     )
 | |
|                     break
 | |
| 
 | |
|                 logger.info(f"> Configuring provider `({provider.provider_type})`")
 | |
|                 pid = provider.provider_type.split("::")[-1]
 | |
|                 updated_providers.append(
 | |
|                     configure_single_provider(
 | |
|                         provider_registry[api],
 | |
|                         Provider(
 | |
|                             provider_id=(f"{pid}-{i:02d}" if len(plist) > 1 else pid),
 | |
|                             provider_type=provider.provider_type,
 | |
|                             config={},
 | |
|                         ),
 | |
|                     )
 | |
|                 )
 | |
|                 logger.info("")
 | |
| 
 | |
|         config.providers[api_str] = updated_providers
 | |
| 
 | |
|     return config
 | |
| 
 | |
| 
 | |
| def upgrade_from_routing_table(
 | |
|     config_dict: dict[str, Any],
 | |
| ) -> dict[str, Any]:
 | |
|     def get_providers(entries):
 | |
|         return [
 | |
|             Provider(
 | |
|                 provider_id=(f"{entry['provider_type']}-{i:02d}" if len(entries) > 1 else entry["provider_type"]),
 | |
|                 provider_type=entry["provider_type"],
 | |
|                 config=entry["config"],
 | |
|             )
 | |
|             for i, entry in enumerate(entries)
 | |
|         ]
 | |
| 
 | |
|     providers_by_api = {}
 | |
| 
 | |
|     routing_table = config_dict.get("routing_table", {})
 | |
|     for api_str, entries in routing_table.items():
 | |
|         providers = get_providers(entries)
 | |
|         providers_by_api[api_str] = providers
 | |
| 
 | |
|     provider_map = config_dict.get("api_providers", config_dict.get("provider_map", {}))
 | |
|     if provider_map:
 | |
|         for api_str, provider in provider_map.items():
 | |
|             if isinstance(provider, dict) and "provider_type" in provider:
 | |
|                 providers_by_api[api_str] = [
 | |
|                     Provider(
 | |
|                         provider_id=f"{provider['provider_type']}",
 | |
|                         provider_type=provider["provider_type"],
 | |
|                         config=provider["config"],
 | |
|                     )
 | |
|                 ]
 | |
| 
 | |
|     config_dict["providers"] = providers_by_api
 | |
| 
 | |
|     config_dict.pop("routing_table", None)
 | |
|     config_dict.pop("api_providers", None)
 | |
|     config_dict.pop("provider_map", None)
 | |
| 
 | |
|     config_dict["apis"] = config_dict["apis_to_serve"]
 | |
|     config_dict.pop("apis_to_serve", None)
 | |
| 
 | |
|     # Add default storage config if not present
 | |
|     if "storage" not in config_dict:
 | |
|         config_dict["storage"] = {
 | |
|             "backends": {
 | |
|                 "kv_default": {
 | |
|                     "type": "kv_sqlite",
 | |
|                     "db_path": "~/.llama/kvstore.db",
 | |
|                 },
 | |
|                 "sql_default": {
 | |
|                     "type": "sql_sqlite",
 | |
|                     "db_path": "~/.llama/sql_store.db",
 | |
|                 },
 | |
|             },
 | |
|             "stores": {
 | |
|                 "metadata": {
 | |
|                     "namespace": "registry",
 | |
|                     "backend": "kv_default",
 | |
|                 },
 | |
|                 "inference": {
 | |
|                     "table_name": "inference_store",
 | |
|                     "backend": "sql_default",
 | |
|                     "max_write_queue_size": 10000,
 | |
|                     "num_writers": 4,
 | |
|                 },
 | |
|                 "conversations": {
 | |
|                     "table_name": "openai_conversations",
 | |
|                     "backend": "sql_default",
 | |
|                 },
 | |
|             },
 | |
|         }
 | |
| 
 | |
|     return config_dict
 | |
| 
 | |
| 
 | |
| def parse_and_maybe_upgrade_config(config_dict: dict[str, Any]) -> StackRunConfig:
 | |
|     version = config_dict.get("version", None)
 | |
|     if version == LLAMA_STACK_RUN_CONFIG_VERSION:
 | |
|         processed_config_dict = replace_env_vars(config_dict)
 | |
|         return StackRunConfig(**cast_image_name_to_string(processed_config_dict))
 | |
| 
 | |
|     if "routing_table" in config_dict:
 | |
|         logger.info("Upgrading config...")
 | |
|         config_dict = upgrade_from_routing_table(config_dict)
 | |
| 
 | |
|     config_dict["version"] = LLAMA_STACK_RUN_CONFIG_VERSION
 | |
| 
 | |
|     if not config_dict.get("external_providers_dir", None):
 | |
|         config_dict["external_providers_dir"] = EXTERNAL_PROVIDERS_DIR
 | |
| 
 | |
|     processed_config_dict = replace_env_vars(config_dict)
 | |
|     return StackRunConfig(**cast_image_name_to_string(processed_config_dict))
 |