Update docs to include rerank models

2025-10-03 19:57:35 +00:00 · 2025-09-10 11:50:55 -07:00 · 2025-09-10 11:50:55 -07:00 · d1b4e090ef
commit d1b4e090ef
parent 78375889ec
2 changed files with 5 additions and 3 deletions
--- a/docs/static/llama-stack-spec.html
+++ b/docs/static/llama-stack-spec.html
@@ -17875,7 +17875,7 @@
        },
        {
            "name": "Inference",
-            "description": "This API provides the raw interface to the underlying models. Two kinds of models are supported:\n- LLM models: these models generate \"raw\" and \"chat\" (conversational) completions.\n- Embedding models: these models generate embeddings to be used for semantic search.",
+            "description": "This API provides the raw interface to the underlying models. Three kinds of models are supported:\n- LLM models: these models generate \"raw\" and \"chat\" (conversational) completions.\n- Embedding models: these models generate embeddings to be used for semantic search.\n- Rerank models: these models reorder the documents by relevance.",
            "x-displayName": "Llama Stack Inference API for generating completions, chat completions, and embeddings."
        },
        {
--- a/docs/static/llama-stack-spec.yaml
+++ b/docs/static/llama-stack-spec.yaml
@@ -13452,13 +13452,15 @@ tags:
    description: ''
  - name: Inference
    description: >-
-      This API provides the raw interface to the underlying models. Two kinds of models
+      This API provides the raw interface to the underlying models. Three kinds of
-      are supported:
+      models are supported:

      - LLM models: these models generate "raw" and "chat" (conversational) completions.

      - Embedding models: these models generate embeddings to be used for semantic
      search.
+
+      - Rerank models: these models reorder the documents by relevance.
    x-displayName: >-
      Llama Stack Inference API for generating completions, chat completions, and
      embeddings.