chore: Adding unit tests for Milvus and OpenAI compatibility (#2640)

# What does this PR do? - Enabling Unit tests for Milvus to start to test OpenAI compatibility and fixing a few bugs. - Also fixed an inconsistency in the Milvus config between remote and inline. - Added pymilvus to extras for testing in CI I'm going to refactor this later to include the other inline providers so that we can catch issues sooner. I have another PR where I've been testing to find other bugs in the implementation (and required changes drafted here: https://github.com/meta-llama/llama-stack/pull/2617). ## Test Plan  --------- Signed-off-by: Francisco Javier Arceo <farceo@redhat.com>
2025-07-13 16:46:09 +00:00 · 2025-07-08 03:50:16 -04:00 · 2025-07-08 03:50:16 -04:00 · 83c89265e0
commit 83c89265e0
parent 27b3cd570f
6 changed files with 1970 additions and 1484 deletions
--- a/docs/source/providers/vector_io/inline_milvus.md
+++ b/docs/source/providers/vector_io/inline_milvus.md
@ -12,6 +12,7 @@ Please refer to the remote provider documentation.
 |-------|------|----------|---------|-------------|
 | `db_path` | `<class 'str'>` | No | PydanticUndefined |  |
 | `kvstore` | `utils.kvstore.config.RedisKVStoreConfig \| utils.kvstore.config.SqliteKVStoreConfig \| utils.kvstore.config.PostgresKVStoreConfig \| utils.kvstore.config.MongoDBKVStoreConfig` | No | sqlite |  |
 | `consistency_level` | `<class 'str'>` | No | Strong | The consistency level of the Milvus server |
 ## Sample Configuration
--- a/llama_stack/providers/inline/vector_io/milvus/config.py
+++ b/llama_stack/providers/inline/vector_io/milvus/config.py
@ -6,7 +6,7 @@
 from typing import Any
-from pydantic import BaseModel
+from pydantic import BaseModel, Field
 from llama_stack.providers.utils.kvstore.config import (
    KVStoreConfig,
@ -19,6 +19,7 @@ from llama_stack.schema_utils import json_schema_type
 class MilvusVectorIOConfig(BaseModel):
    db_path: str
    kvstore: KVStoreConfig
    consistency_level: str = Field(description="The consistency level of the Milvus server", default="Strong")
    @classmethod
    def sample_run_config(cls, __distro_dir__: str, **kwargs: Any) -> dict[str, Any]:
--- a/llama_stack/providers/remote/vector_io/milvus/milvus.py
+++ b/llama_stack/providers/remote/vector_io/milvus/milvus.py
@ -154,10 +154,10 @@ class MilvusVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorDBsProtocolP
        stored_vector_dbs = await self.kvstore.values_in_range(start_key, end_key)
        for vector_db_data in stored_vector_dbs:
-            vector_db = VectorDB.mdel_validate_json(vector_db_data)
+            vector_db = VectorDB.model_validate_json(vector_db_data)
            index = VectorDBWithIndex(
                vector_db,
-                index=await MilvusIndex(
+                index=MilvusIndex(
                    client=self.client,
                    collection_name=vector_db.identifier,
                    consistency_level=self.config.consistency_level,
@ -259,6 +259,8 @@ class MilvusVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorDBsProtocolP
        assert self.kvstore is not None
        key = f"{OPENAI_VECTOR_STORES_PREFIX}{store_id}"
        await self.kvstore.delete(key)
        if store_id in self.openai_vector_stores:
            del self.openai_vector_stores[store_id]
    async def _load_openai_vector_stores(self) -> dict[str, dict[str, Any]]:
        """Load all vector store metadata from persistent storage."""
@ -377,6 +379,29 @@ class MilvusVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorDBsProtocolP
            logger.error(f"Error loading openai vector store file {file_id} for store {store_id}: {e}")
            return {}
    async def _update_openai_vector_store_file(self, store_id: str, file_id: str, file_info: dict[str, Any]) -> None:
        """Update vector store file metadata in Milvus database."""
        try:
            if not await asyncio.to_thread(self.client.has_collection, "openai_vector_store_files"):
                return
            file_data = [
                {
                    "store_file_id": f"{store_id}_{file_id}",
                    "store_id": store_id,
                    "file_id": file_id,
                    "file_info": json.dumps(file_info),
                }
            ]
            await asyncio.to_thread(
                self.client.upsert,
                collection_name="openai_vector_store_files",
                data=file_data,
            )
        except Exception as e:
            logger.error(f"Error updating openai vector store file {file_id} for store {store_id}: {e}")
            raise
    async def _load_openai_vector_store_file_contents(self, store_id: str, file_id: str) -> list[dict[str, Any]]:
        """Load vector store file contents from Milvus database."""
        try:
@ -405,29 +430,6 @@ class MilvusVectorIOAdapter(OpenAIVectorStoreMixin, VectorIO, VectorDBsProtocolP
            logger.error(f"Error loading openai vector store file contents for {file_id} in store {store_id}: {e}")
            return []
    async def _update_openai_vector_store_file(self, store_id: str, file_id: str, file_info: dict[str, Any]) -> None:
        """Update vector store file metadata in Milvus database."""
        try:
            if not await asyncio.to_thread(self.client.has_collection, "openai_vector_store_files"):
                return
            file_data = [
                {
                    "store_file_id": f"{store_id}_{file_id}",
                    "store_id": store_id,
                    "file_id": file_id,
                    "file_info": json.dumps(file_info),
                }
            ]
            await asyncio.to_thread(
                self.client.upsert,
                collection_name="openai_vector_store_files",
                data=file_data,
            )
        except Exception as e:
            logger.error(f"Error updating openai vector store file {file_id} for store {store_id}: {e}")
            raise
    async def _delete_openai_vector_store_file_from_storage(self, store_id: str, file_id: str) -> None:
        """Delete vector store file metadata from Milvus database."""
        try:
--- a/pyproject.toml
+++ b/pyproject.toml
@ -86,6 +86,7 @@ unit = [
    "sqlalchemy[asyncio]>=2.0.41",
    "blobfile",
    "faiss-cpu",
    "pymilvus>=2.5.12",
 ]
 # These are the core dependencies required for running integration tests. They are shared across all
 # providers. If a provider requires additional dependencies, please add them to your environment
@ -106,6 +107,7 @@ test = [
    "sqlalchemy",
    "sqlalchemy[asyncio]>=2.0.41",
    "requests",
    "pymilvus>=2.5.12",
 ]
 docs = [
    "setuptools",
--- a/tests/unit/providers/vector_io/test_vector_io_openai_vector_stores.py
+++ b/tests/unit/providers/vector_io/test_vector_io_openai_vector_stores.py
@ -0,0 +1,420 @@
 # Copyright (c) Meta Platforms, Inc. and affiliates.
 # All rights reserved.
 #
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 import asyncio
 import time
 from unittest.mock import AsyncMock
 import numpy as np
 import pytest
 import pytest_asyncio
 from pymilvus import Collection, MilvusClient, connections
 from llama_stack.apis.vector_dbs import VectorDB
 from llama_stack.apis.vector_io import Chunk, QueryChunksResponse
 from llama_stack.providers.inline.vector_io.milvus.config import MilvusVectorIOConfig, SqliteKVStoreConfig
 from llama_stack.providers.remote.vector_io.milvus.milvus import VECTOR_DBS_PREFIX, MilvusIndex, MilvusVectorIOAdapter
 from llama_stack.providers.utils.kvstore import kvstore_impl
 # TODO: Refactor these to be for inline vector-io providers
 MILVUS_ALIAS = "test_milvus"
 COLLECTION_PREFIX = "test_collection"
@pytest.fixture(scope="session")
 def loop():
    return asyncio.new_event_loop()
@pytest.fixture(scope="session")
 def mock_inference_api(embedding_dimension):
    class MockInferenceAPI:
        async def embed_batch(self, texts: list[str]) -> list[list[float]]:
            return [np.random.rand(embedding_dimension).astype(np.float32).tolist() for _ in texts]
    return MockInferenceAPI()
@pytest_asyncio.fixture
 async def unique_kvstore_config(tmp_path_factory):
    # Generate a unique filename for this test
    unique_id = f"test_kv_{np.random.randint(1e6)}"
    temp_dir = tmp_path_factory.getbasetemp()
    db_path = str(temp_dir / f"{unique_id}.db")
    return SqliteKVStoreConfig(db_path=db_path)
@pytest_asyncio.fixture(scope="session", autouse=True)
 async def milvus_vec_index(embedding_dimension, tmp_path_factory):
    temp_dir = tmp_path_factory.getbasetemp()
    db_path = str(temp_dir / "test_milvus.db")
    client = MilvusClient(db_path)
    name = f"{COLLECTION_PREFIX}_{np.random.randint(1e6)}"
    connections.connect(alias=MILVUS_ALIAS, uri=db_path)
    index = MilvusIndex(client, name, consistency_level="Strong")
    index.db_path = db_path
    yield index
@pytest_asyncio.fixture(scope="session")
 async def milvus_vec_adapter(milvus_vec_index, mock_inference_api):
    config = MilvusVectorIOConfig(
        db_path=milvus_vec_index.db_path,
        kvstore=SqliteKVStoreConfig(),
    )
    adapter = MilvusVectorIOAdapter(
        config=config,
        inference_api=mock_inference_api,
        files_api=None,
    )
    await adapter.initialize()
    await adapter.register_vector_db(
        VectorDB(
            identifier=adapter.metadata_collection_name,
            provider_id="test_provider",
            embedding_model="test_model",
            embedding_dimension=128,
        )
    )
    yield adapter
    await adapter.shutdown()
@pytest.mark.asyncio
 async def test_cache_contains_initial_collection(milvus_vec_adapter):
    coll_name = milvus_vec_adapter.metadata_collection_name
    assert coll_name in milvus_vec_adapter.cache
@pytest.mark.asyncio
 async def test_add_chunks(milvus_vec_index, sample_chunks, sample_embeddings):
    await milvus_vec_index.add_chunks(sample_chunks, sample_embeddings)
    resp = await milvus_vec_index.query_vector(sample_embeddings[0], k=1, score_threshold=-1)
    assert resp.chunks[0].content == sample_chunks[0].content
@pytest.mark.asyncio
 async def test_query_chunks_vector(milvus_vec_index, sample_chunks, sample_embeddings, embedding_dimension):
    await milvus_vec_index.add_chunks(sample_chunks, sample_embeddings)
    query_emb = np.random.rand(embedding_dimension).astype(np.float32)
    resp = await milvus_vec_index.query_vector(query_emb, k=2, score_threshold=0.0)
    assert isinstance(resp, QueryChunksResponse)
    assert len(resp.chunks) == 2
@pytest.mark.asyncio
 async def test_chunk_id_conflict(milvus_vec_index, sample_chunks, embedding_dimension):
    embeddings = np.random.rand(len(sample_chunks), embedding_dimension).astype(np.float32)
    await milvus_vec_index.add_chunks(sample_chunks, embeddings)
    coll = Collection(milvus_vec_index.collection_name, using=MILVUS_ALIAS)
    ids = coll.query(expr="id >= 0", output_fields=["id"], timeout=30)
    flat_ids = [i["id"] for i in ids]
    assert len(flat_ids) == len(set(flat_ids))
@pytest.mark.asyncio
 async def test_initialize_with_milvus_client(milvus_vec_index, unique_kvstore_config):
    kvstore = await kvstore_impl(unique_kvstore_config)
    vector_db = VectorDB(
        identifier="test_db",
        provider_id="test_provider",
        embedding_model="test_model",
        embedding_dimension=128,
        metadata={"test_key": "test_value"},
    )
    test_vector_db_data = vector_db.model_dump_json()
    await kvstore.set(f"{VECTOR_DBS_PREFIX}test_db", test_vector_db_data)
    tmp_milvus_vec_adapter = MilvusVectorIOAdapter(
        config=MilvusVectorIOConfig(
            db_path=milvus_vec_index.db_path,
            kvstore=unique_kvstore_config,
        ),
        inference_api=None,
        files_api=None,
    )
    await tmp_milvus_vec_adapter.initialize()
    vector_db = VectorDB(
        identifier="test_db",
        provider_id="test_provider",
        embedding_model="test_model",
        embedding_dimension=128,
    )
    test_vector_db_data = vector_db.model_dump_json()
    await tmp_milvus_vec_adapter.kvstore.set(f"{VECTOR_DBS_PREFIX}/test_db", test_vector_db_data)
    assert milvus_vec_index.client is not None
    assert isinstance(milvus_vec_index.client, MilvusClient)
    assert tmp_milvus_vec_adapter.cache is not None
    # registering a vector won't update the cache or openai_vector_store collection name
    assert (
        tmp_milvus_vec_adapter.metadata_collection_name not in tmp_milvus_vec_adapter.cache
        or tmp_milvus_vec_adapter.openai_vector_stores
    )
@pytest.mark.asyncio
 async def test_persistence_across_adapter_restarts(
    tmp_path, milvus_vec_index, mock_inference_api, unique_kvstore_config
 ):
    adapter1 = MilvusVectorIOAdapter(
        config=MilvusVectorIOConfig(db_path=milvus_vec_index.db_path, kvstore=unique_kvstore_config),
        inference_api=mock_inference_api,
        files_api=None,
    )
    await adapter1.initialize()
    dummy = VectorDB(
        identifier="foo_db", provider_id="test_provider", embedding_model="test_model", embedding_dimension=128
    )
    await adapter1.register_vector_db(dummy)
    await adapter1.shutdown()
    await adapter1.initialize()
    assert "foo_db" in adapter1.cache
    await adapter1.shutdown()
@pytest.mark.asyncio
 async def test_register_and_unregister_vector_db(milvus_vec_adapter):
    try:
        connections.disconnect(MILVUS_ALIAS)
    except Exception as _:
        pass
    connections.connect(alias=MILVUS_ALIAS, uri=milvus_vec_adapter.config.db_path)
    unique_id = f"foo_db_{np.random.randint(1e6)}"
    dummy = VectorDB(
        identifier=unique_id, provider_id="test_provider", embedding_model="test_model", embedding_dimension=128
    )
    await milvus_vec_adapter.register_vector_db(dummy)
    assert dummy.identifier in milvus_vec_adapter.cache
    if dummy.identifier in milvus_vec_adapter.cache:
        index = milvus_vec_adapter.cache[dummy.identifier].index
        if hasattr(index, "client") and hasattr(index.client, "_using"):
            index.client._using = MILVUS_ALIAS
    await milvus_vec_adapter.unregister_vector_db(dummy.identifier)
    assert dummy.identifier not in milvus_vec_adapter.cache
@pytest.mark.asyncio
 async def test_query_unregistered_raises(milvus_vec_adapter):
    fake_emb = np.zeros(8, dtype=np.float32)
    with pytest.raises(AttributeError):
        await milvus_vec_adapter.query_chunks("no_such_db", fake_emb)
@pytest.mark.asyncio
 async def test_insert_chunks_calls_underlying_index(milvus_vec_adapter):
    fake_index = AsyncMock()
    milvus_vec_adapter._get_and_cache_vector_db_index = AsyncMock(return_value=fake_index)
    chunks = ["chunk1", "chunk2"]
    await milvus_vec_adapter.insert_chunks("db1", chunks)
    fake_index.insert_chunks.assert_awaited_once_with(chunks)
@pytest.mark.asyncio
 async def test_insert_chunks_missing_db_raises(milvus_vec_adapter):
    milvus_vec_adapter._get_and_cache_vector_db_index = AsyncMock(return_value=None)
    with pytest.raises(ValueError):
        await milvus_vec_adapter.insert_chunks("db_not_exist", [])
@pytest.mark.asyncio
 async def test_query_chunks_calls_underlying_index_and_returns(milvus_vec_adapter):
    expected = QueryChunksResponse(chunks=[Chunk(content="c1")], scores=[0.1])
    fake_index = AsyncMock(query_chunks=AsyncMock(return_value=expected))
    milvus_vec_adapter._get_and_cache_vector_db_index = AsyncMock(return_value=fake_index)
    response = await milvus_vec_adapter.query_chunks("db1", "my_query", {"param": 1})
    fake_index.query_chunks.assert_awaited_once_with("my_query", {"param": 1})
    assert response is expected
@pytest.mark.asyncio
 async def test_query_chunks_missing_db_raises(milvus_vec_adapter):
    milvus_vec_adapter._get_and_cache_vector_db_index = AsyncMock(return_value=None)
    with pytest.raises(ValueError):
        await milvus_vec_adapter.query_chunks("db_missing", "q", None)
@pytest.mark.asyncio
 async def test_save_openai_vector_store(milvus_vec_adapter):
    store_id = "vs_1234"
    openai_vector_store = {
        "id": store_id,
        "name": "Test Store",
        "description": "A test OpenAI vector store",
        "vector_db_id": "test_db",
        "embedding_model": "test_model",
    }
    await milvus_vec_adapter._save_openai_vector_store(store_id, openai_vector_store)
    assert openai_vector_store["id"] in milvus_vec_adapter.openai_vector_stores
    assert milvus_vec_adapter.openai_vector_stores[openai_vector_store["id"]] == openai_vector_store
@pytest.mark.asyncio
 async def test_update_openai_vector_store(milvus_vec_adapter):
    store_id = "vs_1234"
    openai_vector_store = {
        "id": store_id,
        "name": "Test Store",
        "description": "A test OpenAI vector store",
        "vector_db_id": "test_db",
        "embedding_model": "test_model",
    }
    await milvus_vec_adapter._save_openai_vector_store(store_id, openai_vector_store)
    openai_vector_store["description"] = "Updated description"
    await milvus_vec_adapter._update_openai_vector_store(store_id, openai_vector_store)
    assert milvus_vec_adapter.openai_vector_stores[openai_vector_store["id"]] == openai_vector_store
@pytest.mark.asyncio
 async def test_delete_openai_vector_store(milvus_vec_adapter):
    store_id = "vs_1234"
    openai_vector_store = {
        "id": store_id,
        "name": "Test Store",
        "description": "A test OpenAI vector store",
        "vector_db_id": "test_db",
        "embedding_model": "test_model",
    }
    await milvus_vec_adapter._save_openai_vector_store(store_id, openai_vector_store)
    await milvus_vec_adapter._delete_openai_vector_store_from_storage(store_id)
    assert openai_vector_store["id"] not in milvus_vec_adapter.openai_vector_stores
@pytest.mark.asyncio
 async def test_load_openai_vector_stores(milvus_vec_adapter):
    store_id = "vs_1234"
    openai_vector_store = {
        "id": store_id,
        "name": "Test Store",
        "description": "A test OpenAI vector store",
        "vector_db_id": "test_db",
        "embedding_model": "test_model",
    }
    await milvus_vec_adapter._save_openai_vector_store(store_id, openai_vector_store)
    loaded_stores = await milvus_vec_adapter._load_openai_vector_stores()
    assert loaded_stores[store_id] == openai_vector_store
@pytest.mark.asyncio
 async def test_save_openai_vector_store_file(milvus_vec_adapter, tmp_path_factory):
    store_id = "vs_1234"
    file_id = "file_1234"
    file_info = {
        "id": file_id,
        "status": "completed",
        "vector_store_id": store_id,
        "attributes": {},
        "filename": "test_file.txt",
        "created_at": int(time.time()),
    }
    file_contents = [
        {"content": "Test content", "chunk_metadata": {"chunk_id": "chunk_001"}, "metadata": {"file_id": file_id}}
    ]
    # validating we don't raise an exception
    await milvus_vec_adapter._save_openai_vector_store_file(store_id, file_id, file_info, file_contents)
@pytest.mark.asyncio
 async def test_update_openai_vector_store_file(milvus_vec_adapter, tmp_path_factory):
    store_id = "vs_1234"
    file_id = "file_1234"
    file_info = {
        "id": file_id,
        "status": "completed",
        "vector_store_id": store_id,
        "attributes": {},
        "filename": "test_file.txt",
        "created_at": int(time.time()),
    }
    file_contents = [
        {"content": "Test content", "chunk_metadata": {"chunk_id": "chunk_001"}, "metadata": {"file_id": file_id}}
    ]
    await milvus_vec_adapter._save_openai_vector_store_file(store_id, file_id, file_info, file_contents)
    updated_file_info = file_info.copy()
    updated_file_info["filename"] = "updated_test_file.txt"
    await milvus_vec_adapter._update_openai_vector_store_file(
        store_id,
        file_id,
        updated_file_info,
    )
    loaded_contents = await milvus_vec_adapter._load_openai_vector_store_file(store_id, file_id)
    assert loaded_contents == updated_file_info
    assert loaded_contents != file_info
@pytest.mark.asyncio
 async def test_load_openai_vector_store_file_contents(milvus_vec_adapter, tmp_path_factory):
    store_id = "vs_1234"
    file_id = "file_1234"
    file_info = {
        "id": file_id,
        "status": "completed",
        "vector_store_id": store_id,
        "attributes": {},
        "filename": "test_file.txt",
        "created_at": int(time.time()),
    }
    file_contents = [
        {"content": "Test content", "chunk_metadata": {"chunk_id": "chunk_001"}, "metadata": {"file_id": file_id}}
    ]
    await milvus_vec_adapter._save_openai_vector_store_file(store_id, file_id, file_info, file_contents)
    loaded_contents = await milvus_vec_adapter._load_openai_vector_store_file_contents(store_id, file_id)
    assert loaded_contents == file_contents
@pytest.mark.asyncio
 async def test_delete_openai_vector_store_file_from_storage(milvus_vec_adapter, tmp_path_factory):
    store_id = "vs_1234"
    file_id = "file_1234"
    file_info = {
        "id": file_id,
        "status": "completed",
        "vector_store_id": store_id,
        "attributes": {},
        "filename": "test_file.txt",
        "created_at": int(time.time()),
    }
    file_contents = [
        {"content": "Test content", "chunk_metadata": {"chunk_id": "chunk_001"}, "metadata": {"file_id": file_id}}
    ]
    await milvus_vec_adapter._save_openai_vector_store_file(store_id, file_id, file_info, file_contents)
    await milvus_vec_adapter._delete_openai_vector_store_file_from_storage(store_id, file_id)
    loaded_contents = await milvus_vec_adapter._load_openai_vector_store_file_contents(store_id, file_id)
    assert loaded_contents == []
--- a/uv.lock
+++ b/uv.lock