mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 04:04:14 +00:00
Merge fa7144163e
into 2f58d87c22
This commit is contained in:
commit
d483239cd7
4 changed files with 12 additions and 19 deletions
11
docs/_static/llama-stack-spec.html
vendored
11
docs/_static/llama-stack-spec.html
vendored
|
@ -17091,14 +17091,14 @@
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"description": "The embedding model to use."
|
"description": "The embedding model to use."
|
||||||
},
|
},
|
||||||
"embedding_dimension": {
|
|
||||||
"type": "integer",
|
|
||||||
"description": "The dimension of the embedding model."
|
|
||||||
},
|
|
||||||
"provider_id": {
|
"provider_id": {
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"description": "The identifier of the provider."
|
"description": "The identifier of the provider."
|
||||||
},
|
},
|
||||||
|
"embedding_dimension": {
|
||||||
|
"type": "integer",
|
||||||
|
"description": "The dimension of the embedding model."
|
||||||
|
},
|
||||||
"vector_db_name": {
|
"vector_db_name": {
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"description": "The name of the vector database."
|
"description": "The name of the vector database."
|
||||||
|
@ -17111,7 +17111,8 @@
|
||||||
"additionalProperties": false,
|
"additionalProperties": false,
|
||||||
"required": [
|
"required": [
|
||||||
"vector_db_id",
|
"vector_db_id",
|
||||||
"embedding_model"
|
"embedding_model",
|
||||||
|
"provider_id"
|
||||||
],
|
],
|
||||||
"title": "RegisterVectorDbRequest"
|
"title": "RegisterVectorDbRequest"
|
||||||
},
|
},
|
||||||
|
|
7
docs/_static/llama-stack-spec.yaml
vendored
7
docs/_static/llama-stack-spec.yaml
vendored
|
@ -12708,12 +12708,12 @@ components:
|
||||||
embedding_model:
|
embedding_model:
|
||||||
type: string
|
type: string
|
||||||
description: The embedding model to use.
|
description: The embedding model to use.
|
||||||
embedding_dimension:
|
|
||||||
type: integer
|
|
||||||
description: The dimension of the embedding model.
|
|
||||||
provider_id:
|
provider_id:
|
||||||
type: string
|
type: string
|
||||||
description: The identifier of the provider.
|
description: The identifier of the provider.
|
||||||
|
embedding_dimension:
|
||||||
|
type: integer
|
||||||
|
description: The dimension of the embedding model.
|
||||||
vector_db_name:
|
vector_db_name:
|
||||||
type: string
|
type: string
|
||||||
description: The name of the vector database.
|
description: The name of the vector database.
|
||||||
|
@ -12725,6 +12725,7 @@ components:
|
||||||
required:
|
required:
|
||||||
- vector_db_id
|
- vector_db_id
|
||||||
- embedding_model
|
- embedding_model
|
||||||
|
- provider_id
|
||||||
title: RegisterVectorDbRequest
|
title: RegisterVectorDbRequest
|
||||||
RerankRequest:
|
RerankRequest:
|
||||||
type: object
|
type: object
|
||||||
|
|
|
@ -90,8 +90,8 @@ class VectorDBs(Protocol):
|
||||||
self,
|
self,
|
||||||
vector_db_id: str,
|
vector_db_id: str,
|
||||||
embedding_model: str,
|
embedding_model: str,
|
||||||
|
provider_id: str,
|
||||||
embedding_dimension: int | None = 384,
|
embedding_dimension: int | None = 384,
|
||||||
provider_id: str | None = None,
|
|
||||||
vector_db_name: str | None = None,
|
vector_db_name: str | None = None,
|
||||||
provider_vector_db_id: str | None = None,
|
provider_vector_db_id: str | None = None,
|
||||||
) -> VectorDB:
|
) -> VectorDB:
|
||||||
|
|
|
@ -47,20 +47,11 @@ class VectorDBsRoutingTable(CommonRoutingTableImpl, VectorDBs):
|
||||||
self,
|
self,
|
||||||
vector_db_id: str,
|
vector_db_id: str,
|
||||||
embedding_model: str,
|
embedding_model: str,
|
||||||
|
provider_id: str,
|
||||||
embedding_dimension: int | None = 384,
|
embedding_dimension: int | None = 384,
|
||||||
provider_id: str | None = None,
|
|
||||||
provider_vector_db_id: str | None = None,
|
provider_vector_db_id: str | None = None,
|
||||||
vector_db_name: str | None = None,
|
vector_db_name: str | None = None,
|
||||||
) -> VectorDB:
|
) -> VectorDB:
|
||||||
if provider_id is None:
|
|
||||||
if len(self.impls_by_provider_id) > 0:
|
|
||||||
provider_id = list(self.impls_by_provider_id.keys())[0]
|
|
||||||
if len(self.impls_by_provider_id) > 1:
|
|
||||||
logger.warning(
|
|
||||||
f"No provider specified and multiple providers available. Arbitrarily selected the first provider {provider_id}."
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
raise ValueError("No provider available. Please configure a vector_io provider.")
|
|
||||||
model = await lookup_model(self, embedding_model)
|
model = await lookup_model(self, embedding_model)
|
||||||
if model is None:
|
if model is None:
|
||||||
raise ModelNotFoundError(embedding_model)
|
raise ModelNotFoundError(embedding_model)
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue