mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 04:04:14 +00:00
Merge fa7144163e
into 2f58d87c22
This commit is contained in:
commit
d483239cd7
4 changed files with 12 additions and 19 deletions
11
docs/_static/llama-stack-spec.html
vendored
11
docs/_static/llama-stack-spec.html
vendored
|
@ -17091,14 +17091,14 @@
|
|||
"type": "string",
|
||||
"description": "The embedding model to use."
|
||||
},
|
||||
"embedding_dimension": {
|
||||
"type": "integer",
|
||||
"description": "The dimension of the embedding model."
|
||||
},
|
||||
"provider_id": {
|
||||
"type": "string",
|
||||
"description": "The identifier of the provider."
|
||||
},
|
||||
"embedding_dimension": {
|
||||
"type": "integer",
|
||||
"description": "The dimension of the embedding model."
|
||||
},
|
||||
"vector_db_name": {
|
||||
"type": "string",
|
||||
"description": "The name of the vector database."
|
||||
|
@ -17111,7 +17111,8 @@
|
|||
"additionalProperties": false,
|
||||
"required": [
|
||||
"vector_db_id",
|
||||
"embedding_model"
|
||||
"embedding_model",
|
||||
"provider_id"
|
||||
],
|
||||
"title": "RegisterVectorDbRequest"
|
||||
},
|
||||
|
|
7
docs/_static/llama-stack-spec.yaml
vendored
7
docs/_static/llama-stack-spec.yaml
vendored
|
@ -12708,12 +12708,12 @@ components:
|
|||
embedding_model:
|
||||
type: string
|
||||
description: The embedding model to use.
|
||||
embedding_dimension:
|
||||
type: integer
|
||||
description: The dimension of the embedding model.
|
||||
provider_id:
|
||||
type: string
|
||||
description: The identifier of the provider.
|
||||
embedding_dimension:
|
||||
type: integer
|
||||
description: The dimension of the embedding model.
|
||||
vector_db_name:
|
||||
type: string
|
||||
description: The name of the vector database.
|
||||
|
@ -12725,6 +12725,7 @@ components:
|
|||
required:
|
||||
- vector_db_id
|
||||
- embedding_model
|
||||
- provider_id
|
||||
title: RegisterVectorDbRequest
|
||||
RerankRequest:
|
||||
type: object
|
||||
|
|
|
@ -90,8 +90,8 @@ class VectorDBs(Protocol):
|
|||
self,
|
||||
vector_db_id: str,
|
||||
embedding_model: str,
|
||||
provider_id: str,
|
||||
embedding_dimension: int | None = 384,
|
||||
provider_id: str | None = None,
|
||||
vector_db_name: str | None = None,
|
||||
provider_vector_db_id: str | None = None,
|
||||
) -> VectorDB:
|
||||
|
|
|
@ -47,20 +47,11 @@ class VectorDBsRoutingTable(CommonRoutingTableImpl, VectorDBs):
|
|||
self,
|
||||
vector_db_id: str,
|
||||
embedding_model: str,
|
||||
provider_id: str,
|
||||
embedding_dimension: int | None = 384,
|
||||
provider_id: str | None = None,
|
||||
provider_vector_db_id: str | None = None,
|
||||
vector_db_name: str | None = None,
|
||||
) -> VectorDB:
|
||||
if provider_id is None:
|
||||
if len(self.impls_by_provider_id) > 0:
|
||||
provider_id = list(self.impls_by_provider_id.keys())[0]
|
||||
if len(self.impls_by_provider_id) > 1:
|
||||
logger.warning(
|
||||
f"No provider specified and multiple providers available. Arbitrarily selected the first provider {provider_id}."
|
||||
)
|
||||
else:
|
||||
raise ValueError("No provider available. Please configure a vector_io provider.")
|
||||
model = await lookup_model(self, embedding_model)
|
||||
if model is None:
|
||||
raise ModelNotFoundError(embedding_model)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue