feat(vector_io): add custom collection names support for vector stores (#4135)

2025-12-03 09:53:45 +00:00 · 2025-11-20 19:28:33 +02:00 · 2025-11-20 19:28:33 +02:00 · 6e6ddd3c69
commit 6e6ddd3c69
parent 91f1b352b4
5 changed files with 140 additions and 12 deletions
--- a/src/llama_stack/core/routers/vector_io.py
+++ b/src/llama_stack/core/routers/vector_io.py
@ -5,6 +5,7 @@
 # the root directory of this source tree.

 import asyncio
+import re
 import uuid
 from typing import Annotated, Any

@ -44,6 +45,17 @@ from llama_stack_api import (
 logger = get_logger(name=__name__, category="core::routers")


+def validate_collection_name(collection_name: str) -> None:
+    if not collection_name:
+        raise ValueError("collection_name cannot be empty")
+
+    if not re.match(r"^[a-zA-Z0-9_-]+$", collection_name):
+        raise ValueError(
+            f"collection_name '{collection_name}' contains invalid characters. "
+            "Only alphanumeric characters, hyphens, and underscores are allowed."
+        )
+
+
 class VectorIORouter(VectorIO):
    """Routes to an provider based on the vector db identifier"""

@ -160,13 +172,25 @@ class VectorIORouter(VectorIO):
            else:
                provider_id = list(self.routing_table.impls_by_provider_id.keys())[0]

+        # Extract and validate collection_name if provided
+        collection_name = extra.get("collection_name")
+        if collection_name:
+            validate_collection_name(collection_name)
+            provider_vector_store_id = collection_name
+            logger.debug(f"Using custom collection name: {collection_name}")
+        else:
+            # Fall back to auto-generated UUID for backward compatibility
+            provider_vector_store_id = f"vs_{uuid.uuid4()}"
+
+        # Always generate a unique vector_store_id for internal routing
        vector_store_id = f"vs_{uuid.uuid4()}"
+
        registered_vector_store = await self.routing_table.register_vector_store(
            vector_store_id=vector_store_id,
            embedding_model=embedding_model,
            embedding_dimension=embedding_dimension,
            provider_id=provider_id,
-            provider_vector_store_id=vector_store_id,
+            provider_vector_store_id=provider_vector_store_id,
            vector_store_name=params.name,
        )
        provider = await self.routing_table.get_provider_impl(registered_vector_store.identifier)
@ -174,8 +198,14 @@ class VectorIORouter(VectorIO):
        # Update model_extra with registered values so provider uses the already-registered vector_store
        if params.model_extra is None:
            params.model_extra = {}
+        params.model_extra["vector_store_id"] = vector_store_id  # Pass canonical UUID to Provider
        params.model_extra["provider_vector_store_id"] = registered_vector_store.provider_resource_id
        params.model_extra["provider_id"] = registered_vector_store.provider_id
+
+        # Add collection_name to metadata so users can see what was used
+        if params.metadata is None:
+            params.metadata = {}
+        params.metadata["provider_vector_store_id"] = provider_vector_store_id
        if embedding_model is not None:
            params.model_extra["embedding_model"] = embedding_model
        if embedding_dimension is not None:
--- a/src/llama_stack/providers/inline/vector_io/faiss/faiss.py
+++ b/src/llama_stack/providers/inline/vector_io/faiss/faiss.py
@ -201,7 +201,11 @@ class FaissVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorStoresProtoco
            vector_store = VectorStore.model_validate_json(vector_store_data)
            index = VectorStoreWithIndex(
                vector_store,
-                await FaissIndex.create(vector_store.embedding_dimension, self.kvstore, vector_store.identifier),
+                await FaissIndex.create(
+                    vector_store.embedding_dimension,
+                    self.kvstore,
+                    vector_store.provider_resource_id or vector_store.identifier,
+                ),
                self.inference_api,
            )
            self.cache[vector_store.identifier] = index
@ -239,7 +243,11 @@ class FaissVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorStoresProtoco
        # Store in cache
        self.cache[vector_store.identifier] = VectorStoreWithIndex(
            vector_store=vector_store,
-            index=await FaissIndex.create(vector_store.embedding_dimension, self.kvstore, vector_store.identifier),
+            index=await FaissIndex.create(
+                vector_store.embedding_dimension,
+                self.kvstore,
+                vector_store.provider_resource_id or vector_store.identifier,
+            ),
            inference_api=self.inference_api,
        )

@ -272,7 +280,11 @@ class FaissVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorStoresProtoco
        vector_store = VectorStore.model_validate_json(vector_store_data)
        index = VectorStoreWithIndex(
            vector_store=vector_store,
-            index=await FaissIndex.create(vector_store.embedding_dimension, self.kvstore, vector_store.identifier),
+            index=await FaissIndex.create(
+                vector_store.embedding_dimension,
+                self.kvstore,
+                vector_store.provider_resource_id or vector_store.identifier,
+            ),
            inference_api=self.inference_api,
        )
        self.cache[vector_store_id] = index
--- a/src/llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py
+++ b/src/llama_stack/providers/inline/vector_io/sqlite_vec/sqlite_vec.py
@ -401,7 +401,9 @@ class SQLiteVecVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorStoresPro
        for db_json in stored_vector_stores:
            vector_store = VectorStore.model_validate_json(db_json)
            index = await SQLiteVecIndex.create(
-                vector_store.embedding_dimension, self.config.db_path, vector_store.identifier
+                vector_store.embedding_dimension,
+                self.config.db_path,
+                vector_store.provider_resource_id or vector_store.identifier,
            )
            self.cache[vector_store.identifier] = VectorStoreWithIndex(vector_store, index, self.inference_api)

@ -425,7 +427,9 @@ class SQLiteVecVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorStoresPro

        # Create and cache the index
        index = await SQLiteVecIndex.create(
-            vector_store.embedding_dimension, self.config.db_path, vector_store.identifier
+            vector_store.embedding_dimension,
+            self.config.db_path,
+            vector_store.provider_resource_id or vector_store.identifier,
        )
        self.cache[vector_store.identifier] = VectorStoreWithIndex(vector_store, index, self.inference_api)

@ -448,7 +452,7 @@ class SQLiteVecVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorStoresPro
            index=SQLiteVecIndex(
                dimension=vector_store.embedding_dimension,
                db_path=self.config.db_path,
-                bank_id=vector_store.identifier,
+                bank_id=vector_store.provider_resource_id or vector_store.identifier,
                kvstore=self.kvstore,
            ),
            inference_api=self.inference_api,
--- a/src/llama_stack/providers/utils/memory/openai_vector_store_mixin.py
+++ b/src/llama_stack/providers/utils/memory/openai_vector_store_mixin.py
@ -360,7 +360,11 @@ class OpenAIVectorStoreMixin(ABC):
        extra_body = params.model_extra or {}
        metadata = params.metadata or {}

-        provider_vector_store_id = extra_body.get("provider_vector_store_id")
+        # Get the canonical UUID from router (or generate if called directly without router)
+        vector_store_id = extra_body.get("vector_store_id") or generate_object_id("vector_store", lambda: f"vs_{uuid.uuid4()}")
+
+        # Get the physical storage name (custom collection name or fallback to UUID)
+        provider_vector_store_id = extra_body.get("provider_vector_store_id") or vector_store_id

        # Use embedding info from metadata if available, otherwise from extra_body
        if metadata.get("embedding_model"):
@ -381,8 +385,6 @@ class OpenAIVectorStoreMixin(ABC):

        # use provider_id set by router; fallback to provider's own ID when used directly via --stack-config
        provider_id = extra_body.get("provider_id") or getattr(self, "__provider_id__", None)
-        # Derive the canonical vector_store_id (allow override, else generate)
-        vector_store_id = provider_vector_store_id or generate_object_id("vector_store", lambda: f"vs_{uuid.uuid4()}")

        if embedding_model is None:
            raise ValueError("embedding_model is required")
@ -396,11 +398,11 @@ class OpenAIVectorStoreMixin(ABC):

        # call to the provider to create any index, etc.
        vector_store = VectorStore(
-            identifier=vector_store_id,
+            identifier=vector_store_id,  # Canonical UUID for routing
            embedding_dimension=embedding_dimension,
            embedding_model=embedding_model,
            provider_id=provider_id,
-            provider_resource_id=vector_store_id,
+            provider_resource_id=provider_vector_store_id,  # Physical storage name (custom or UUID)
            vector_store_name=params.name,
        )
        await self.register_vector_store(vector_store)
--- a/tests/integration/vector_io/test_openai_vector_stores.py
+++ b/tests/integration/vector_io/test_openai_vector_stores.py
@ -1698,3 +1698,83 @@ def test_openai_vector_store_file_contents_with_extra_query(
    assert with_flags_embedding is not None, "Embeddings should be included when include_embeddings=True"
    assert len(with_flags_embedding) > 0, "Embedding should be a non-empty list"
    assert without_flags_embedding is None, "Embeddings should not be included when include_embeddings=False"
+
+
+@vector_provider_wrapper
+def test_openai_vector_store_custom_collection_name(
+    compat_client_with_empty_stores, client_with_models, embedding_model_id, embedding_dimension, vector_io_provider_id
+):
+    """Test creating a vector store with a custom collection name."""
+    skip_if_provider_doesnt_support_openai_vector_stores(client_with_models)
+    client = compat_client_with_empty_stores
+
+    # Create vector store with custom collection name
+    vector_store = client.vector_stores.create(
+        name="Test Custom Collection",
+        extra_body={
+            "embedding_model": embedding_model_id,
+            "provider_id": vector_io_provider_id,
+            "collection_name": "my_custom_collection",
+        },
+    )
+
+    assert vector_store is not None
+    assert vector_store.id.startswith("vs_")
+    assert "provider_vector_store_id" in vector_store.metadata
+    assert vector_store.metadata["provider_vector_store_id"] == "my_custom_collection"
+
+
+@vector_provider_wrapper
+def test_openai_vector_store_collection_name_validation(
+    compat_client_with_empty_stores, client_with_models, embedding_model_id, embedding_dimension, vector_io_provider_id
+):
+    """Test that invalid collection names are rejected."""
+    skip_if_provider_doesnt_support_openai_vector_stores(client_with_models)
+    client = compat_client_with_empty_stores
+
+    # Test invalid collection names
+    invalid_names = ["with spaces", "with/slashes", "with@special", ""]
+
+    for invalid_name in invalid_names:
+        with pytest.raises((BadRequestError, ValueError)):
+            client.vector_stores.create(
+                name="Test Invalid",
+                extra_body={
+                    "embedding_model": embedding_model_id,
+                    "provider_id": vector_io_provider_id,
+                    "collection_name": invalid_name,
+                },
+            )
+
+
+@vector_provider_wrapper
+def test_openai_vector_store_collection_name_with_data(
+    compat_client_with_empty_stores, client_with_models, sample_chunks, embedding_model_id, embedding_dimension, vector_io_provider_id
+):
+    """Test that custom collection names work with data insertion and search."""
+    skip_if_provider_doesnt_support_openai_vector_stores(client_with_models)
+    compat_client = compat_client_with_empty_stores
+    llama_client = client_with_models
+
+    # Create vector store with custom collection name
+    vector_store = compat_client.vector_stores.create(
+        name="Data Test Collection",
+        extra_body={
+            "embedding_model": embedding_model_id,
+            "provider_id": vector_io_provider_id,
+            "collection_name": "test_data_collection",
+        },
+    )
+
+    # Insert and search data
+    llama_client.vector_io.insert(vector_store_id=vector_store.id, chunks=sample_chunks[:2])
+
+    search_response = compat_client.vector_stores.search(
+        vector_store_id=vector_store.id,
+        query="What is Python?",
+        max_num_results=2,
+    )
+
+    assert search_response is not None
+    assert len(search_response.data) > 0
+    assert search_response.data[0].attributes["document_id"] == "doc1"