mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-29 15:23:51 +00:00
reverting to original call order for a simpler change
Signed-off-by: Francisco Javier Arceo <farceo@redhat.com>
This commit is contained in:
parent
56811a1483
commit
d361154102
6 changed files with 25 additions and 17 deletions
11
docs/_static/llama-stack-spec.html
vendored
11
docs/_static/llama-stack-spec.html
vendored
|
@ -15610,10 +15610,6 @@
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"description": "The identifier of the vector database to register."
|
"description": "The identifier of the vector database to register."
|
||||||
},
|
},
|
||||||
"provider_vector_db_id": {
|
|
||||||
"type": "string",
|
|
||||||
"description": "The identifier of the vector database in the provider."
|
|
||||||
},
|
|
||||||
"embedding_model": {
|
"embedding_model": {
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"description": "The embedding model to use."
|
"description": "The embedding model to use."
|
||||||
|
@ -15628,13 +15624,16 @@
|
||||||
},
|
},
|
||||||
"vector_db_name": {
|
"vector_db_name": {
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"description": "The name of the vector database."
|
"description": "The name of the vector database."
|
||||||
|
},
|
||||||
|
"provider_vector_db_id": {
|
||||||
|
"type": "string",
|
||||||
|
"description": "The identifier of the vector database in the provider."
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"additionalProperties": false,
|
"additionalProperties": false,
|
||||||
"required": [
|
"required": [
|
||||||
"vector_db_id",
|
"vector_db_id",
|
||||||
"provider_vector_db_id",
|
|
||||||
"embedding_model"
|
"embedding_model"
|
||||||
],
|
],
|
||||||
"title": "RegisterVectorDbRequest"
|
"title": "RegisterVectorDbRequest"
|
||||||
|
|
13
docs/_static/llama-stack-spec.yaml
vendored
13
docs/_static/llama-stack-spec.yaml
vendored
|
@ -10922,10 +10922,6 @@ components:
|
||||||
type: string
|
type: string
|
||||||
description: >-
|
description: >-
|
||||||
The identifier of the vector database to register.
|
The identifier of the vector database to register.
|
||||||
provider_vector_db_id:
|
|
||||||
type: string
|
|
||||||
description: >-
|
|
||||||
The identifier of the vector database in the provider.
|
|
||||||
embedding_model:
|
embedding_model:
|
||||||
type: string
|
type: string
|
||||||
description: The embedding model to use.
|
description: The embedding model to use.
|
||||||
|
@ -10937,11 +10933,16 @@ components:
|
||||||
description: The identifier of the provider.
|
description: The identifier of the provider.
|
||||||
vector_db_name:
|
vector_db_name:
|
||||||
type: string
|
type: string
|
||||||
description: The name of the vector database.
|
description: >-
|
||||||
|
The name of the vector database.
|
||||||
|
provider_vector_db_id:
|
||||||
|
type: string
|
||||||
|
description: >-
|
||||||
|
The identifier of the vector database in the provider.
|
||||||
additionalProperties: false
|
additionalProperties: false
|
||||||
required:
|
required:
|
||||||
- vector_db_id
|
- vector_db_id
|
||||||
- provider_vector_db_id
|
|
||||||
- embedding_model
|
- embedding_model
|
||||||
title: RegisterVectorDbRequest
|
title: RegisterVectorDbRequest
|
||||||
ResumeAgentTurnRequest:
|
ResumeAgentTurnRequest:
|
||||||
|
|
|
@ -68,11 +68,11 @@ class VectorDBs(Protocol):
|
||||||
async def register_vector_db(
|
async def register_vector_db(
|
||||||
self,
|
self,
|
||||||
vector_db_id: str,
|
vector_db_id: str,
|
||||||
provider_vector_db_id: str,
|
|
||||||
embedding_model: str,
|
embedding_model: str,
|
||||||
embedding_dimension: int | None = 384,
|
embedding_dimension: int | None = 384,
|
||||||
provider_id: str | None = None,
|
provider_id: str | None = None,
|
||||||
vector_db_name: str | None = None,
|
vector_db_name: str | None = None,
|
||||||
|
provider_vector_db_id: str | None = None,
|
||||||
) -> VectorDB:
|
) -> VectorDB:
|
||||||
"""Register a vector database.
|
"""Register a vector database.
|
||||||
|
|
||||||
|
@ -82,6 +82,7 @@ class VectorDBs(Protocol):
|
||||||
:param embedding_dimension: The dimension of the embedding model.
|
:param embedding_dimension: The dimension of the embedding model.
|
||||||
:param provider_id: The identifier of the provider.
|
:param provider_id: The identifier of the provider.
|
||||||
:param vector_db_name: The name of the vector database.
|
:param vector_db_name: The name of the vector database.
|
||||||
|
:param provider_vector_db_id: The identifier of the vector database in the provider.
|
||||||
:returns: A VectorDB.
|
:returns: A VectorDB.
|
||||||
"""
|
"""
|
||||||
...
|
...
|
||||||
|
|
|
@ -79,20 +79,20 @@ class VectorIORouter(VectorIO):
|
||||||
async def register_vector_db(
|
async def register_vector_db(
|
||||||
self,
|
self,
|
||||||
vector_db_id: str,
|
vector_db_id: str,
|
||||||
provider_vector_db_id: str,
|
|
||||||
embedding_model: str,
|
embedding_model: str,
|
||||||
embedding_dimension: int | None = 384,
|
embedding_dimension: int | None = 384,
|
||||||
provider_id: str | None = None,
|
provider_id: str | None = None,
|
||||||
vector_db_name: str | None = None,
|
vector_db_name: str | None = None,
|
||||||
|
provider_vector_db_id: str | None = None,
|
||||||
) -> None:
|
) -> None:
|
||||||
logger.debug(f"VectorIORouter.register_vector_db: {vector_db_id}, {embedding_model}")
|
logger.debug(f"VectorIORouter.register_vector_db: {vector_db_id}, {embedding_model}")
|
||||||
await self.routing_table.register_vector_db(
|
await self.routing_table.register_vector_db(
|
||||||
vector_db_id,
|
vector_db_id,
|
||||||
provider_vector_db_id,
|
|
||||||
embedding_model,
|
embedding_model,
|
||||||
embedding_dimension,
|
embedding_dimension,
|
||||||
provider_id,
|
provider_id,
|
||||||
vector_db_name,
|
vector_db_name,
|
||||||
|
provider_vector_db_id,
|
||||||
)
|
)
|
||||||
|
|
||||||
async def insert_chunks(
|
async def insert_chunks(
|
||||||
|
@ -126,6 +126,7 @@ class VectorIORouter(VectorIO):
|
||||||
embedding_model: str | None = None,
|
embedding_model: str | None = None,
|
||||||
embedding_dimension: int | None = None,
|
embedding_dimension: int | None = None,
|
||||||
provider_id: str | None = None,
|
provider_id: str | None = None,
|
||||||
|
provider_vector_db_id: str | None = None,
|
||||||
) -> VectorStoreObject:
|
) -> VectorStoreObject:
|
||||||
logger.debug(f"VectorIORouter.openai_create_vector_store: name={name}, provider_id={provider_id}")
|
logger.debug(f"VectorIORouter.openai_create_vector_store: name={name}, provider_id={provider_id}")
|
||||||
|
|
||||||
|
@ -139,11 +140,11 @@ class VectorIORouter(VectorIO):
|
||||||
|
|
||||||
vector_db_id = f"vs_{uuid.uuid4()}"
|
vector_db_id = f"vs_{uuid.uuid4()}"
|
||||||
registered_vector_db = await self.routing_table.register_vector_db(
|
registered_vector_db = await self.routing_table.register_vector_db(
|
||||||
vector_db_id,
|
|
||||||
vector_db_id,
|
vector_db_id,
|
||||||
embedding_model,
|
embedding_model,
|
||||||
embedding_dimension,
|
embedding_dimension,
|
||||||
provider_id,
|
provider_id,
|
||||||
|
provider_vector_db_id,
|
||||||
name,
|
name,
|
||||||
)
|
)
|
||||||
return await self.routing_table.get_provider_impl(registered_vector_db.identifier).openai_create_vector_store(
|
return await self.routing_table.get_provider_impl(registered_vector_db.identifier).openai_create_vector_store(
|
||||||
|
|
|
@ -32,12 +32,14 @@ class VectorDBsRoutingTable(CommonRoutingTableImpl, VectorDBs):
|
||||||
async def register_vector_db(
|
async def register_vector_db(
|
||||||
self,
|
self,
|
||||||
vector_db_id: str,
|
vector_db_id: str,
|
||||||
provider_vector_db_id: str,
|
|
||||||
embedding_model: str,
|
embedding_model: str,
|
||||||
embedding_dimension: int | None = 384,
|
embedding_dimension: int | None = 384,
|
||||||
provider_id: str | None = None,
|
provider_id: str | None = None,
|
||||||
|
provider_vector_db_id: str | None = None,
|
||||||
vector_db_name: str | None = None,
|
vector_db_name: str | None = None,
|
||||||
) -> VectorDB:
|
) -> VectorDB:
|
||||||
|
if provider_vector_db_id is None:
|
||||||
|
provider_vector_db_id = vector_db_id
|
||||||
if provider_id is None:
|
if provider_id is None:
|
||||||
if len(self.impls_by_provider_id) > 0:
|
if len(self.impls_by_provider_id) > 0:
|
||||||
provider_id = list(self.impls_by_provider_id.keys())[0]
|
provider_id = list(self.impls_by_provider_id.keys())[0]
|
||||||
|
|
|
@ -53,6 +53,7 @@ def test_vector_db_retrieve(client_with_empty_registry, embedding_model_id, embe
|
||||||
vector_db_id=vector_db_id,
|
vector_db_id=vector_db_id,
|
||||||
embedding_model=embedding_model_id,
|
embedding_model=embedding_model_id,
|
||||||
embedding_dimension=embedding_dimension,
|
embedding_dimension=embedding_dimension,
|
||||||
|
provider_vector_db_id=vector_db_id,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Retrieve the memory bank and validate its properties
|
# Retrieve the memory bank and validate its properties
|
||||||
|
@ -69,6 +70,7 @@ def test_vector_db_register(client_with_empty_registry, embedding_model_id, embe
|
||||||
vector_db_id=vector_db_id,
|
vector_db_id=vector_db_id,
|
||||||
embedding_model=embedding_model_id,
|
embedding_model=embedding_model_id,
|
||||||
embedding_dimension=embedding_dimension,
|
embedding_dimension=embedding_dimension,
|
||||||
|
provider_vector_db_id=vector_db_id,
|
||||||
)
|
)
|
||||||
|
|
||||||
vector_dbs_after_register = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
|
vector_dbs_after_register = [vector_db.identifier for vector_db in client_with_empty_registry.vector_dbs.list()]
|
||||||
|
@ -96,6 +98,7 @@ def test_insert_chunks(client_with_empty_registry, embedding_model_id, embedding
|
||||||
vector_db_id=vector_db_id,
|
vector_db_id=vector_db_id,
|
||||||
embedding_model=embedding_model_id,
|
embedding_model=embedding_model_id,
|
||||||
embedding_dimension=embedding_dimension,
|
embedding_dimension=embedding_dimension,
|
||||||
|
provider_vector_db_id=vector_db_id,
|
||||||
)
|
)
|
||||||
|
|
||||||
client_with_empty_registry.vector_io.insert(
|
client_with_empty_registry.vector_io.insert(
|
||||||
|
@ -131,6 +134,7 @@ def test_insert_chunks_with_precomputed_embeddings(client_with_empty_registry, e
|
||||||
vector_db_id=vector_db_id,
|
vector_db_id=vector_db_id,
|
||||||
embedding_model=embedding_model_id,
|
embedding_model=embedding_model_id,
|
||||||
embedding_dimension=embedding_dimension,
|
embedding_dimension=embedding_dimension,
|
||||||
|
provider_vector_db_id=vector_db_id,
|
||||||
)
|
)
|
||||||
|
|
||||||
chunks_with_embeddings = [
|
chunks_with_embeddings = [
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue