feat(stores)!: use backend storage references instead of configs (#3697)

**This PR changes configurations in a backward incompatible way.** Run configs today repeat full SQLite/Postgres snippets everywhere a store is needed, which means duplicated credentials, extra connection pools, and lots of drift between files. This PR introduces named storage backends so the stack and providers can share a single catalog and reference those backends by name. ## Key Changes - Add `storage.backends` to `StackRunConfig`, register each KV/SQL backend once at startup, and validate that references point to the right family. - Move server stores under `storage.stores` with lightweight references (backend + namespace/table) instead of full configs. - Update every provider/config/doc to use the new reference style; docs/codegen now surface the simplified YAML. ## Migration Before: ```yaml metadata_store: type: sqlite db_path: ~/.llama/distributions/foo/registry.db inference_store: type: postgres host: ${env.POSTGRES_HOST} port: ${env.POSTGRES_PORT} db: ${env.POSTGRES_DB} user: ${env.POSTGRES_USER} password: ${env.POSTGRES_PASSWORD} conversations_store: type: postgres host: ${env.POSTGRES_HOST} port: ${env.POSTGRES_PORT} db: ${env.POSTGRES_DB} user: ${env.POSTGRES_USER} password: ${env.POSTGRES_PASSWORD} ``` After: ```yaml storage: backends: kv_default: type: kv_sqlite db_path: ~/.llama/distributions/foo/kvstore.db sql_default: type: sql_postgres host: ${env.POSTGRES_HOST} port: ${env.POSTGRES_PORT} db: ${env.POSTGRES_DB} user: ${env.POSTGRES_USER} password: ${env.POSTGRES_PASSWORD} stores: metadata: backend: kv_default namespace: registry inference: backend: sql_default table_name: inference_store max_write_queue_size: 10000 num_writers: 4 conversations: backend: sql_default table_name: openai_conversations ``` Provider configs follow the same pattern—for example, a Chroma vector adapter switches from: ```yaml providers: vector_io: - provider_id: chromadb provider_type: remote::chromadb config: url: ${env.CHROMADB_URL} kvstore: type: sqlite db_path: ~/.llama/distributions/foo/chroma.db ``` to: ```yaml providers: vector_io: - provider_id: chromadb provider_type: remote::chromadb config: url: ${env.CHROMADB_URL} persistence: backend: kv_default namespace: vector_io::chroma_remote ``` Once the backends are declared, everything else just points at them, so rotating credentials or swapping to Postgres happens in one place and the stack reuses a single connection pool.
2025-10-22 16:23:08 +00:00 · 2025-10-20 13:20:09 -07:00 · 2025-10-20 13:20:09 -07:00 · 2c43285e22
commit 2c43285e22
parent add64e8e2a
105 changed files with 2290 additions and 1292 deletions
--- a/tests/unit/distribution/test_distribution.py
+++ b/tests/unit/distribution/test_distribution.py
@ -13,6 +13,15 @@ from pydantic import BaseModel, Field, ValidationError

 from llama_stack.core.datatypes import Api, Provider, StackRunConfig
 from llama_stack.core.distribution import INTERNAL_APIS, get_provider_registry, providable_apis
+from llama_stack.core.storage.datatypes import (
+    InferenceStoreReference,
+    KVStoreReference,
+    ServerStoresConfig,
+    SqliteKVStoreConfig,
+    SqliteSqlStoreConfig,
+    SqlStoreReference,
+    StorageConfig,
+)
 from llama_stack.providers.datatypes import ProviderSpec


@ -29,6 +38,32 @@ class SampleConfig(BaseModel):
        }


+def _default_storage() -> StorageConfig:
+    return StorageConfig(
+        backends={
+            "kv_default": SqliteKVStoreConfig(db_path=":memory:"),
+            "sql_default": SqliteSqlStoreConfig(db_path=":memory:"),
+        },
+        stores=ServerStoresConfig(
+            metadata=KVStoreReference(backend="kv_default", namespace="registry"),
+            inference=InferenceStoreReference(backend="sql_default", table_name="inference_store"),
+            conversations=SqlStoreReference(backend="sql_default", table_name="conversations"),
+        ),
+    )
+
+
+def make_stack_config(**overrides) -> StackRunConfig:
+    storage = overrides.pop("storage", _default_storage())
+    defaults = dict(
+        image_name="test_image",
+        apis=[],
+        providers={},
+        storage=storage,
+    )
+    defaults.update(overrides)
+    return StackRunConfig(**defaults)
+
+
@pytest.fixture
 def mock_providers():
    """Mock the available_providers function to return test providers."""
@ -47,8 +82,8 @@ def mock_providers():
@pytest.fixture
 def base_config(tmp_path):
    """Create a base StackRunConfig with common settings."""
-    return StackRunConfig(
-        image_name="test_image",
+    return make_stack_config(
+        apis=["inference"],
        providers={
            "inference": [
                Provider(
@ -222,8 +257,8 @@ class TestProviderRegistry:

    def test_missing_directory(self, mock_providers):
        """Test handling of missing external providers directory."""
-        config = StackRunConfig(
-            image_name="test_image",
+        config = make_stack_config(
+            apis=["inference"],
            providers={
                "inference": [
                    Provider(
@ -278,7 +313,6 @@ pip_packages:
        """Test loading an external provider from a module (success path)."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.providers.datatypes import Api, ProviderSpec

        # Simulate a provider module with get_provider_spec
@ -293,7 +327,7 @@ pip_packages:
        import_module_side_effect = make_import_module_side_effect(external_module=fake_module)

        with patch("importlib.import_module", side_effect=import_module_side_effect) as mock_import:
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -317,12 +351,11 @@ pip_packages:

    def test_external_provider_from_module_not_found(self, mock_providers):
        """Test handling ModuleNotFoundError for missing provider module."""
-        from llama_stack.core.datatypes import Provider, StackRunConfig

        import_module_side_effect = make_import_module_side_effect(raise_for_external=True)

        with patch("importlib.import_module", side_effect=import_module_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -341,12 +374,11 @@ pip_packages:

    def test_external_provider_from_module_missing_get_provider_spec(self, mock_providers):
        """Test handling missing get_provider_spec in provider module (should raise ValueError)."""
-        from llama_stack.core.datatypes import Provider, StackRunConfig

        import_module_side_effect = make_import_module_side_effect(missing_get_provider_spec=True)

        with patch("importlib.import_module", side_effect=import_module_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -399,13 +431,12 @@ class TestGetExternalProvidersFromModule:

    def test_stackrunconfig_provider_without_module(self, mock_providers):
        """Test that providers without module attribute are skipped."""
-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module

        import_module_side_effect = make_import_module_side_effect()

        with patch("importlib.import_module", side_effect=import_module_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -426,7 +457,6 @@ class TestGetExternalProvidersFromModule:
        """Test provider with module containing version spec (e.g., package==1.0.0)."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module
        from llama_stack.providers.datatypes import ProviderSpec

@ -444,7 +474,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -564,7 +594,6 @@ class TestGetExternalProvidersFromModule:
        """Test when get_provider_spec returns a list of specs."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module
        from llama_stack.providers.datatypes import ProviderSpec

@ -589,7 +618,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -613,7 +642,6 @@ class TestGetExternalProvidersFromModule:
        """Test that list return filters specs by provider_type."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module
        from llama_stack.providers.datatypes import ProviderSpec

@ -638,7 +666,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -662,7 +690,6 @@ class TestGetExternalProvidersFromModule:
        """Test that list return adds multiple different provider_types when config requests them."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module
        from llama_stack.providers.datatypes import ProviderSpec

@ -688,7 +715,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -718,7 +745,6 @@ class TestGetExternalProvidersFromModule:

    def test_module_not_found_raises_value_error(self, mock_providers):
        """Test that ModuleNotFoundError raises ValueError with helpful message."""
-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module

        def import_side_effect(name):
@ -727,7 +753,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -751,7 +777,6 @@ class TestGetExternalProvidersFromModule:
        """Test that generic exceptions are properly raised."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module

        def bad_spec():
@ -765,7 +790,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [
@ -787,10 +812,9 @@ class TestGetExternalProvidersFromModule:

    def test_empty_provider_list(self, mock_providers):
        """Test with empty provider list."""
-        from llama_stack.core.datatypes import StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module

-        config = StackRunConfig(
+        config = make_stack_config(
            image_name="test_image",
            providers={},
        )
@ -805,7 +829,6 @@ class TestGetExternalProvidersFromModule:
        """Test multiple APIs with providers."""
        from types import SimpleNamespace

-        from llama_stack.core.datatypes import Provider, StackRunConfig
        from llama_stack.core.distribution import get_external_providers_from_module
        from llama_stack.providers.datatypes import ProviderSpec

@ -830,7 +853,7 @@ class TestGetExternalProvidersFromModule:
            raise ModuleNotFoundError(name)

        with patch("importlib.import_module", side_effect=import_side_effect):
-            config = StackRunConfig(
+            config = make_stack_config(
                image_name="test_image",
                providers={
                    "inference": [