mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-04 12:07:34 +00:00
Update docs
This commit is contained in:
parent
a0e6e82c1e
commit
3538477070
7 changed files with 6 additions and 137 deletions
|
@@ -191,7 +191,6 @@ class InferenceRouter(Inference):
|
|||
items: list[str | OpenAIChatCompletionContentPartTextParam | OpenAIChatCompletionContentPartImageParam],
|
||||
max_num_results: int | None = None,
|
||||
) -> RerankResponse:
|
||||
"""Route rerank requests to the appropriate provider based on the model."""
|
||||
logger.debug(f"InferenceRouter.rerank: {model}")
|
||||
model_obj = await self._get_model(model, ModelType.rerank)
|
||||
provider = await self.routing_table.get_provider_impl(model_obj.identifier)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue