mirror of
				https://github.com/meta-llama/llama-stack.git
				synced 2025-10-26 01:12:59 +00:00 
			
		
		
		
	
		
			Some checks failed
		
		
	
	Integration Auth Tests / test-matrix (oauth2_token) (push) Failing after 5s
				
			Test Llama Stack Build / build-ubi9-container-distribution (push) Failing after 7s
				
			Vector IO Integration Tests / test-matrix (3.12, inline::faiss) (push) Failing after 15s
				
			Test Llama Stack Build / generate-matrix (push) Successful in 9s
				
			Vector IO Integration Tests / test-matrix (3.12, remote::chromadb) (push) Failing after 15s
				
			Vector IO Integration Tests / test-matrix (3.12, inline::milvus) (push) Failing after 19s
				
			Test Llama Stack Build / build-custom-container-distribution (push) Failing after 13s
				
			Test Llama Stack Build / build-single-provider (push) Failing after 13s
				
			Vector IO Integration Tests / test-matrix (3.13, remote::pgvector) (push) Failing after 15s
				
			Test External Providers Installed via Module / test-external-providers-from-module (venv) (push) Has been skipped
				
			SqlStore Integration Tests / test-postgres (3.13) (push) Failing after 22s
				
			Vector IO Integration Tests / test-matrix (3.13, remote::chromadb) (push) Failing after 14s
				
			Integration Tests (Replay) / discover-tests (push) Successful in 24s
				
			Vector IO Integration Tests / test-matrix (3.13, remote::qdrant) (push) Failing after 16s
				
			Vector IO Integration Tests / test-matrix (3.12, remote::weaviate) (push) Failing after 17s
				
			Vector IO Integration Tests / test-matrix (3.13, remote::weaviate) (push) Failing after 15s
				
			Vector IO Integration Tests / test-matrix (3.13, inline::milvus) (push) Failing after 17s
				
			Vector IO Integration Tests / test-matrix (3.13, inline::faiss) (push) Failing after 18s
				
			Update ReadTheDocs / update-readthedocs (push) Failing after 12s
				
			Unit Tests / unit-tests (3.12) (push) Failing after 11s
				
			Vector IO Integration Tests / test-matrix (3.12, remote::qdrant) (push) Failing after 16s
				
			Python Package Build Test / build (3.12) (push) Failing after 20s
				
			Python Package Build Test / build (3.13) (push) Failing after 18s
				
			Vector IO Integration Tests / test-matrix (3.12, inline::sqlite-vec) (push) Failing after 18s
				
			Test External API and Providers / test-external (venv) (push) Failing after 18s
				
			Unit Tests / unit-tests (3.13) (push) Failing after 19s
				
			SqlStore Integration Tests / test-postgres (3.12) (push) Failing after 42s
				
			Integration Tests (Replay) / run-replay-mode-tests (push) Failing after 22s
				
			Vector IO Integration Tests / test-matrix (3.13, inline::sqlite-vec) (push) Failing after 1m12s
				
			Vector IO Integration Tests / test-matrix (3.12, remote::pgvector) (push) Failing after 1m15s
				
			Test Llama Stack Build / build (push) Failing after 32s
				
			Pre-commit / pre-commit (push) Successful in 2m39s
				
			# What does this PR do? Adds support to Vector store Open AI APIs in Qdrant. <!-- If resolving an issue, uncomment and update the line below --> Closes #2463 ## Test Plan <!-- Describe the tests you ran to verify your changes with result summaries. *Provide clear instructions so the plan can be easily re-executed.* --> Signed-off-by: Varsha Prasad Narsing <varshaprasad96@gmail.com> Co-authored-by: ehhuang <ehhuang@users.noreply.github.com> Co-authored-by: Francisco Arceo <arceofrancisco@gmail.com>
		
			
				
	
	
		
			138 lines
		
	
	
	
		
			4.7 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			138 lines
		
	
	
	
		
			4.7 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # Copyright (c) Meta Platforms, Inc. and affiliates.
 | |
| # All rights reserved.
 | |
| #
 | |
| # This source code is licensed under the terms described in the LICENSE file in
 | |
| # the root directory of this source tree.
 | |
| 
 | |
| import asyncio
 | |
| import os
 | |
| from typing import Any
 | |
| from unittest.mock import AsyncMock, MagicMock, patch
 | |
| 
 | |
| import pytest
 | |
| 
 | |
| from llama_stack.apis.inference import EmbeddingsResponse, Inference
 | |
| from llama_stack.apis.vector_io import (
 | |
|     QueryChunksResponse,
 | |
|     VectorDB,
 | |
|     VectorDBStore,
 | |
| )
 | |
| from llama_stack.providers.inline.vector_io.qdrant.config import (
 | |
|     QdrantVectorIOConfig as InlineQdrantVectorIOConfig,
 | |
| )
 | |
| from llama_stack.providers.remote.vector_io.qdrant.qdrant import (
 | |
|     QdrantVectorIOAdapter,
 | |
| )
 | |
| from llama_stack.providers.utils.kvstore.config import SqliteKVStoreConfig
 | |
| 
 | |
| # This test is a unit test for the QdrantVectorIOAdapter class. This should only contain
 | |
| # tests which are specific to this class. More general (API-level) tests should be placed in
 | |
| # tests/integration/vector_io/
 | |
| #
 | |
| # How to run this test:
 | |
| #
 | |
| # pytest tests/unit/providers/vector_io/test_qdrant.py \
 | |
| # -v -s --tb=short --disable-warnings --asyncio-mode=auto
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| def qdrant_config(tmp_path) -> InlineQdrantVectorIOConfig:
 | |
|     kvstore_config = SqliteKVStoreConfig(db_name=os.path.join(tmp_path, "test_kvstore.db"))
 | |
|     return InlineQdrantVectorIOConfig(path=os.path.join(tmp_path, "qdrant.db"), kvstore=kvstore_config)
 | |
| 
 | |
| 
 | |
| @pytest.fixture(scope="session")
 | |
| def loop():
 | |
|     return asyncio.new_event_loop()
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| def mock_vector_db(vector_db_id) -> MagicMock:
 | |
|     mock_vector_db = MagicMock(spec=VectorDB)
 | |
|     mock_vector_db.embedding_model = "embedding_model"
 | |
|     mock_vector_db.identifier = vector_db_id
 | |
|     mock_vector_db.embedding_dimension = 384
 | |
|     mock_vector_db.model_dump_json.return_value = (
 | |
|         '{"identifier": "' + vector_db_id + '", "embedding_model": "embedding_model", "embedding_dimension": 384}'
 | |
|     )
 | |
|     return mock_vector_db
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| def mock_vector_db_store(mock_vector_db) -> MagicMock:
 | |
|     mock_store = MagicMock(spec=VectorDBStore)
 | |
|     mock_store.get_vector_db = AsyncMock(return_value=mock_vector_db)
 | |
|     return mock_store
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| def mock_api_service(sample_embeddings):
 | |
|     mock_api_service = MagicMock(spec=Inference)
 | |
|     mock_api_service.embeddings = AsyncMock(return_value=EmbeddingsResponse(embeddings=sample_embeddings))
 | |
|     return mock_api_service
 | |
| 
 | |
| 
 | |
| @pytest.fixture
 | |
| async def qdrant_adapter(qdrant_config, mock_vector_db_store, mock_api_service, loop) -> QdrantVectorIOAdapter:
 | |
|     adapter = QdrantVectorIOAdapter(config=qdrant_config, inference_api=mock_api_service, files_api=None)
 | |
|     adapter.vector_db_store = mock_vector_db_store
 | |
|     await adapter.initialize()
 | |
|     yield adapter
 | |
|     await adapter.shutdown()
 | |
| 
 | |
| 
 | |
| __QUERY = "Sample query"
 | |
| 
 | |
| 
 | |
| @pytest.mark.parametrize("max_query_chunks, expected_chunks", [(2, 2), (100, 60)])
 | |
| async def test_qdrant_adapter_returns_expected_chunks(
 | |
|     qdrant_adapter: QdrantVectorIOAdapter,
 | |
|     vector_db_id,
 | |
|     sample_chunks,
 | |
|     sample_embeddings,
 | |
|     max_query_chunks,
 | |
|     expected_chunks,
 | |
| ) -> None:
 | |
|     assert qdrant_adapter is not None
 | |
|     await qdrant_adapter.insert_chunks(vector_db_id, sample_chunks)
 | |
| 
 | |
|     index = await qdrant_adapter._get_and_cache_vector_db_index(vector_db_id=vector_db_id)
 | |
|     assert index is not None
 | |
| 
 | |
|     response = await qdrant_adapter.query_chunks(
 | |
|         query=__QUERY,
 | |
|         vector_db_id=vector_db_id,
 | |
|         params={"max_chunks": max_query_chunks, "mode": "vector"},
 | |
|     )
 | |
|     assert isinstance(response, QueryChunksResponse)
 | |
|     assert len(response.chunks) == expected_chunks
 | |
| 
 | |
| 
 | |
| # To by-pass attempt to convert a Mock to JSON
 | |
| def _prepare_for_json(value: Any) -> str:
 | |
|     return str(value)
 | |
| 
 | |
| 
 | |
| @patch("llama_stack.providers.utils.telemetry.trace_protocol._prepare_for_json", new=_prepare_for_json)
 | |
| async def test_qdrant_register_and_unregister_vector_db(
 | |
|     qdrant_adapter: QdrantVectorIOAdapter,
 | |
|     mock_vector_db,
 | |
|     sample_chunks,
 | |
| ) -> None:
 | |
|     # Initially, no collections
 | |
|     vector_db_id = mock_vector_db.identifier
 | |
|     assert len((await qdrant_adapter.client.get_collections()).collections) == 0
 | |
| 
 | |
|     # Register does not create a collection
 | |
|     assert not (await qdrant_adapter.client.collection_exists(vector_db_id))
 | |
|     await qdrant_adapter.register_vector_db(mock_vector_db)
 | |
|     assert not (await qdrant_adapter.client.collection_exists(vector_db_id))
 | |
| 
 | |
|     # First insert creates the collection
 | |
|     await qdrant_adapter.insert_chunks(vector_db_id, sample_chunks)
 | |
|     assert await qdrant_adapter.client.collection_exists(vector_db_id)
 | |
| 
 | |
|     # Unregister deletes the collection
 | |
|     await qdrant_adapter.unregister_vector_db(vector_db_id)
 | |
|     assert not (await qdrant_adapter.client.collection_exists(vector_db_id))
 | |
|     assert len((await qdrant_adapter.client.get_collections()).collections) == 0
 |