Update docs

2025-10-04 12:07:34 +00:00 · 2025-09-12 19:55:04 -07:00 · 2025-09-12 19:55:04 -07:00 · 3538477070
commit 3538477070
parent a0e6e82c1e
7 changed files with 6 additions and 137 deletions
--- a/llama_stack/apis/inference/inference.py
+++ b/llama_stack/apis/inference/inference.py
@@ -1162,7 +1162,7 @@ class Inference(InferenceProvider):
    This API provides the raw interface to the underlying models. Three kinds of models are supported:
    - LLM models: these models generate "raw" and "chat" (conversational) completions.
    - Embedding models: these models generate embeddings to be used for semantic search.
-    - Rerank models: these models reorder the documents by relevance.
+    - Rerank models: these models reorder the documents based on their relevance to a query.
    """

    @webmethod(route="/openai/v1/chat/completions", method="GET", level=LLAMA_STACK_API_V1, deprecated=True)