diff --git a/docs/static/deprecated-llama-stack-spec.yaml b/docs/static/deprecated-llama-stack-spec.yaml
index 8a230f8b6..3bc965eb7 100644
--- a/docs/static/deprecated-llama-stack-spec.yaml
+++ b/docs/static/deprecated-llama-stack-spec.yaml
@@ -13,1183 +13,7 @@ info:
     migration reference only.
 servers:
   - url: http://any-hosted-llama-stack.com
-paths:
-  /v1/agents:
-    get:
-      responses:
-        '200':
-          description: A PaginatedResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PaginatedResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: List all agents.
-      description: List all agents.
-      parameters:
-        - name: start_index
-          in: query
-          description: The index to start the pagination from.
-          required: false
-          schema:
-            type: integer
-        - name: limit
-          in: query
-          description: The number of agents to return.
-          required: false
-          schema:
-            type: integer
-      deprecated: true
-    post:
-      responses:
-        '200':
-          description: >-
-            An AgentCreateResponse with the agent ID.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/AgentCreateResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: >-
-        Create an agent with the given configuration.
-      description: >-
-        Create an agent with the given configuration.
-      parameters: []
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/CreateAgentRequest'
-        required: true
-      deprecated: true
-  /v1/agents/{agent_id}:
-    get:
-      responses:
-        '200':
-          description: An Agent of the agent.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Agent'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: Describe an agent by its ID.
-      description: Describe an agent by its ID.
-      parameters:
-        - name: agent_id
-          in: path
-          description: ID of the agent.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-    delete:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: >-
-        Delete an agent by its ID and its associated sessions and turns.
-      description: >-
-        Delete an agent by its ID and its associated sessions and turns.
-      parameters:
-        - name: agent_id
-          in: path
-          description: The ID of the agent to delete.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/agents/{agent_id}/session:
-    post:
-      responses:
-        '200':
-          description: An AgentSessionCreateResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/AgentSessionCreateResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: Create a new session for an agent.
-      description: Create a new session for an agent.
-      parameters:
-        - name: agent_id
-          in: path
-          description: >-
-            The ID of the agent to create the session for.
-          required: true
-          schema:
-            type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/CreateAgentSessionRequest'
-        required: true
-      deprecated: true
-  /v1/agents/{agent_id}/session/{session_id}:
-    get:
-      responses:
-        '200':
-          description: A Session.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Session'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: Retrieve an agent session by its ID.
-      description: Retrieve an agent session by its ID.
-      parameters:
-        - name: session_id
-          in: path
-          description: The ID of the session to get.
-          required: true
-          schema:
-            type: string
-        - name: agent_id
-          in: path
-          description: >-
-            The ID of the agent to get the session for.
-          required: true
-          schema:
-            type: string
-        - name: turn_ids
-          in: query
-          description: >-
-            (Optional) List of turn IDs to filter the session by.
-          required: false
-          schema:
-            type: array
-            items:
-              type: string
-      deprecated: true
-    delete:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: >-
-        Delete an agent session by its ID and its associated turns.
-      description: >-
-        Delete an agent session by its ID and its associated turns.
-      parameters:
-        - name: session_id
-          in: path
-          description: The ID of the session to delete.
-          required: true
-          schema:
-            type: string
-        - name: agent_id
-          in: path
-          description: >-
-            The ID of the agent to delete the session for.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/agents/{agent_id}/session/{session_id}/turn:
-    post:
-      responses:
-        '200':
-          description: >-
-            If stream=False, returns a Turn object. If stream=True, returns an SSE
-            event stream of AgentTurnResponseStreamChunk.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Turn'
-            text/event-stream:
-              schema:
-                $ref: '#/components/schemas/AgentTurnResponseStreamChunk'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: Create a new turn for an agent.
-      description: Create a new turn for an agent.
-      parameters:
-        - name: agent_id
-          in: path
-          description: >-
-            The ID of the agent to create the turn for.
-          required: true
-          schema:
-            type: string
-        - name: session_id
-          in: path
-          description: >-
-            The ID of the session to create the turn for.
-          required: true
-          schema:
-            type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/CreateAgentTurnRequest'
-        required: true
-      deprecated: true
-  /v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}:
-    get:
-      responses:
-        '200':
-          description: A Turn.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Turn'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: Retrieve an agent turn by its ID.
-      description: Retrieve an agent turn by its ID.
-      parameters:
-        - name: agent_id
-          in: path
-          description: The ID of the agent to get the turn for.
-          required: true
-          schema:
-            type: string
-        - name: session_id
-          in: path
-          description: >-
-            The ID of the session to get the turn for.
-          required: true
-          schema:
-            type: string
-        - name: turn_id
-          in: path
-          description: The ID of the turn to get.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}/resume:
-    post:
-      responses:
-        '200':
-          description: >-
-            A Turn object if stream is False, otherwise an AsyncIterator of AgentTurnResponseStreamChunk
-            objects.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Turn'
-            text/event-stream:
-              schema:
-                $ref: '#/components/schemas/AgentTurnResponseStreamChunk'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: >-
-        Resume an agent turn with executed tool call responses.
-      description: >-
-        Resume an agent turn with executed tool call responses.
-
-        When a Turn has the status `awaiting_input` due to pending input from client
-        side tool calls, this endpoint can be used to submit the outputs from the
-        tool calls once they are ready.
-      parameters:
-        - name: agent_id
-          in: path
-          description: The ID of the agent to resume.
-          required: true
-          schema:
-            type: string
-        - name: session_id
-          in: path
-          description: The ID of the session to resume.
-          required: true
-          schema:
-            type: string
-        - name: turn_id
-          in: path
-          description: The ID of the turn to resume.
-          required: true
-          schema:
-            type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/ResumeAgentTurnRequest'
-        required: true
-      deprecated: true
-  /v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}/step/{step_id}:
-    get:
-      responses:
-        '200':
-          description: An AgentStepResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/AgentStepResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: Retrieve an agent step by its ID.
-      description: Retrieve an agent step by its ID.
-      parameters:
-        - name: agent_id
-          in: path
-          description: The ID of the agent to get the step for.
-          required: true
-          schema:
-            type: string
-        - name: session_id
-          in: path
-          description: >-
-            The ID of the session to get the step for.
-          required: true
-          schema:
-            type: string
-        - name: turn_id
-          in: path
-          description: The ID of the turn to get the step for.
-          required: true
-          schema:
-            type: string
-        - name: step_id
-          in: path
-          description: The ID of the step to get.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/agents/{agent_id}/sessions:
-    get:
-      responses:
-        '200':
-          description: A PaginatedResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PaginatedResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Agents
-      summary: List all session(s) of a given agent.
-      description: List all session(s) of a given agent.
-      parameters:
-        - name: agent_id
-          in: path
-          description: >-
-            The ID of the agent to list sessions for.
-          required: true
-          schema:
-            type: string
-        - name: start_index
-          in: query
-          description: The index to start the pagination from.
-          required: false
-          schema:
-            type: integer
-        - name: limit
-          in: query
-          description: The number of sessions to return.
-          required: false
-          schema:
-            type: integer
-      deprecated: true
-  /v1/datasetio/append-rows/{dataset_id}:
-    post:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - DatasetIO
-      summary: Append rows to a dataset.
-      description: Append rows to a dataset.
-      parameters:
-        - name: dataset_id
-          in: path
-          description: >-
-            The ID of the dataset to append the rows to.
-          required: true
-          schema:
-            type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/AppendRowsRequest'
-        required: true
-      deprecated: true
-  /v1/datasetio/iterrows/{dataset_id}:
-    get:
-      responses:
-        '200':
-          description: A PaginatedResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PaginatedResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - DatasetIO
-      summary: >-
-        Get a paginated list of rows from a dataset.
-      description: >-
-        Get a paginated list of rows from a dataset.
-
-        Uses offset-based pagination where:
-
-        - start_index: The starting index (0-based). If None, starts from beginning.
-
-        - limit: Number of items to return. If None or -1, returns all items.
-
-
-        The response includes:
-
-        - data: List of items for the current page.
-
-        - has_more: Whether there are more items available after this set.
-      parameters:
-        - name: dataset_id
-          in: path
-          description: >-
-            The ID of the dataset to get the rows from.
-          required: true
-          schema:
-            type: string
-        - name: start_index
-          in: query
-          description: >-
-            Index into dataset for the first row to get. Get all rows if None.
-          required: false
-          schema:
-            type: integer
-        - name: limit
-          in: query
-          description: The number of rows to get.
-          required: false
-          schema:
-            type: integer
-      deprecated: true
-  /v1/datasets:
-    get:
-      responses:
-        '200':
-          description: A ListDatasetsResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/ListDatasetsResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Datasets
-      summary: List all datasets.
-      description: List all datasets.
-      parameters: []
-      deprecated: true
-    post:
-      responses:
-        '200':
-          description: A Dataset.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Dataset'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Datasets
-      summary: Register a new dataset.
-      description: Register a new dataset.
-      parameters: []
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/RegisterDatasetRequest'
-        required: true
-      deprecated: true
-  /v1/datasets/{dataset_id}:
-    get:
-      responses:
-        '200':
-          description: A Dataset.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Dataset'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Datasets
-      summary: Get a dataset by its ID.
-      description: Get a dataset by its ID.
-      parameters:
-        - name: dataset_id
-          in: path
-          description: The ID of the dataset to get.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-    delete:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Datasets
-      summary: Unregister a dataset by its ID.
-      description: Unregister a dataset by its ID.
-      parameters:
-        - name: dataset_id
-          in: path
-          description: The ID of the dataset to unregister.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/eval/benchmarks:
-    get:
-      responses:
-        '200':
-          description: A ListBenchmarksResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/ListBenchmarksResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Benchmarks
-      summary: List all benchmarks.
-      description: List all benchmarks.
-      parameters: []
-      deprecated: true
-    post:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Benchmarks
-      summary: Register a benchmark.
-      description: Register a benchmark.
-      parameters: []
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/RegisterBenchmarkRequest'
-        required: true
-      deprecated: true
-  /v1/eval/benchmarks/{benchmark_id}:
-    get:
-      responses:
-        '200':
-          description: A Benchmark.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Benchmark'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Benchmarks
-      summary: Get a benchmark by its ID.
-      description: Get a benchmark by its ID.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: The ID of the benchmark to get.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-    delete:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Benchmarks
-      summary: Unregister a benchmark.
-      description: Unregister a benchmark.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: The ID of the benchmark to unregister.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/eval/benchmarks/{benchmark_id}/evaluations:
-    post:
-      responses:
-        '200':
-          description: >-
-            EvaluateResponse object containing generations and scores.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/EvaluateResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Eval
-      summary: Evaluate a list of rows on a benchmark.
-      description: Evaluate a list of rows on a benchmark.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: >-
-            The ID of the benchmark to run the evaluation on.
-          required: true
-          schema:
-            type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/EvaluateRowsRequest'
-        required: true
-      deprecated: true
-  /v1/eval/benchmarks/{benchmark_id}/jobs:
-    post:
-      responses:
-        '200':
-          description: >-
-            The job that was created to run the evaluation.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Job'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Eval
-      summary: Run an evaluation on a benchmark.
-      description: Run an evaluation on a benchmark.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: >-
-            The ID of the benchmark to run the evaluation on.
-          required: true
-          schema:
-            type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/RunEvalRequest'
-        required: true
-      deprecated: true
-  /v1/eval/benchmarks/{benchmark_id}/jobs/{job_id}:
-    get:
-      responses:
-        '200':
-          description: The status of the evaluation job.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/Job'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Eval
-      summary: Get the status of a job.
-      description: Get the status of a job.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: >-
-            The ID of the benchmark to run the evaluation on.
-          required: true
-          schema:
-            type: string
-        - name: job_id
-          in: path
-          description: The ID of the job to get the status of.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-    delete:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Eval
-      summary: Cancel a job.
-      description: Cancel a job.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: >-
-            The ID of the benchmark to run the evaluation on.
-          required: true
-          schema:
-            type: string
-        - name: job_id
-          in: path
-          description: The ID of the job to cancel.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/eval/benchmarks/{benchmark_id}/jobs/{job_id}/result:
-    get:
-      responses:
-        '200':
-          description: The result of the job.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/EvaluateResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - Eval
-      summary: Get the result of a job.
-      description: Get the result of a job.
-      parameters:
-        - name: benchmark_id
-          in: path
-          description: >-
-            The ID of the benchmark to run the evaluation on.
-          required: true
-          schema:
-            type: string
-        - name: job_id
-          in: path
-          description: The ID of the job to get the result of.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/post-training/job/artifacts:
-    get:
-      responses:
-        '200':
-          description: A PostTrainingJobArtifactsResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PostTrainingJobArtifactsResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - PostTraining (Coming Soon)
-      summary: Get the artifacts of a training job.
-      description: Get the artifacts of a training job.
-      parameters:
-        - name: job_uuid
-          in: query
-          description: >-
-            The UUID of the job to get the artifacts of.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/post-training/job/cancel:
-    post:
-      responses:
-        '200':
-          description: OK
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - PostTraining (Coming Soon)
-      summary: Cancel a training job.
-      description: Cancel a training job.
-      parameters: []
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/CancelTrainingJobRequest'
-        required: true
-      deprecated: true
-  /v1/post-training/job/status:
-    get:
-      responses:
-        '200':
-          description: A PostTrainingJobStatusResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PostTrainingJobStatusResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - PostTraining (Coming Soon)
-      summary: Get the status of a training job.
-      description: Get the status of a training job.
-      parameters:
-        - name: job_uuid
-          in: query
-          description: >-
-            The UUID of the job to get the status of.
-          required: true
-          schema:
-            type: string
-      deprecated: true
-  /v1/post-training/jobs:
-    get:
-      responses:
-        '200':
-          description: A ListPostTrainingJobsResponse.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/ListPostTrainingJobsResponse'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - PostTraining (Coming Soon)
-      summary: Get all training jobs.
-      description: Get all training jobs.
-      parameters: []
-      deprecated: true
-  /v1/post-training/preference-optimize:
-    post:
-      responses:
-        '200':
-          description: A PostTrainingJob.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PostTrainingJob'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - PostTraining (Coming Soon)
-      summary: Run preference optimization of a model.
-      description: Run preference optimization of a model.
-      parameters: []
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/PreferenceOptimizeRequest'
-        required: true
-      deprecated: true
-  /v1/post-training/supervised-fine-tune:
-    post:
-      responses:
-        '200':
-          description: A PostTrainingJob.
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/PostTrainingJob'
-        '400':
-          $ref: '#/components/responses/BadRequest400'
-        '429':
-          $ref: >-
-            #/components/responses/TooManyRequests429
-        '500':
-          $ref: >-
-            #/components/responses/InternalServerError500
-        default:
-          $ref: '#/components/responses/DefaultError'
-      tags:
-        - PostTraining (Coming Soon)
-      summary: Run supervised fine-tuning of a model.
-      description: Run supervised fine-tuning of a model.
-      parameters: []
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/SupervisedFineTuneRequest'
-        required: true
-      deprecated: true
+paths: {}
 jsonSchemaDialect: >-
   https://json-schema.org/draft/2020-12/schema
 components:
@@ -1222,2638 +46,6 @@ components:
       title: Error
       description: >-
         Error response from the API. Roughly follows RFC 7807.
-    PaginatedResponse:
-      type: object
-      properties:
-        data:
-          type: array
-          items:
-            type: object
-            additionalProperties:
-              oneOf:
-                - type: 'null'
-                - type: boolean
-                - type: number
-                - type: string
-                - type: array
-                - type: object
-          description: The list of items for the current page
-        has_more:
-          type: boolean
-          description: >-
-            Whether there are more items available after this set
-        url:
-          type: string
-          description: The URL for accessing this list
-      additionalProperties: false
-      required:
-        - data
-        - has_more
-      title: PaginatedResponse
-      description: >-
-        A generic paginated response that follows a simple format.
-    AgentConfig:
-      type: object
-      properties:
-        sampling_params:
-          $ref: '#/components/schemas/SamplingParams'
-        input_shields:
-          type: array
-          items:
-            type: string
-        output_shields:
-          type: array
-          items:
-            type: string
-        toolgroups:
-          type: array
-          items:
-            $ref: '#/components/schemas/AgentTool'
-        client_tools:
-          type: array
-          items:
-            $ref: '#/components/schemas/ToolDef'
-        tool_choice:
-          type: string
-          enum:
-            - auto
-            - required
-            - none
-          title: ToolChoice
-          description: >-
-            Whether tool use is required or automatic. This is a hint to the model
-            which may not be followed. It depends on the Instruction Following capabilities
-            of the model.
-          deprecated: true
-        tool_prompt_format:
-          type: string
-          enum:
-            - json
-            - function_tag
-            - python_list
-          title: ToolPromptFormat
-          description: >-
-            Prompt format for calling custom / zero shot tools.
-          deprecated: true
-        tool_config:
-          $ref: '#/components/schemas/ToolConfig'
-        max_infer_iters:
-          type: integer
-          default: 10
-        model:
-          type: string
-          description: >-
-            The model identifier to use for the agent
-        instructions:
-          type: string
-          description: The system instructions for the agent
-        name:
-          type: string
-          description: >-
-            Optional name for the agent, used in telemetry and identification
-        enable_session_persistence:
-          type: boolean
-          default: false
-          description: >-
-            Optional flag indicating whether session data has to be persisted
-        response_format:
-          $ref: '#/components/schemas/ResponseFormat'
-          description: Optional response format configuration
-      additionalProperties: false
-      required:
-        - model
-        - instructions
-      title: AgentConfig
-      description: Configuration for an agent.
-    AgentTool:
-      oneOf:
-        - type: string
-        - type: object
-          properties:
-            name:
-              type: string
-            args:
-              type: object
-              additionalProperties:
-                oneOf:
-                  - type: 'null'
-                  - type: boolean
-                  - type: number
-                  - type: string
-                  - type: array
-                  - type: object
-          additionalProperties: false
-          required:
-            - name
-            - args
-          title: AgentToolGroupWithArgs
-    GrammarResponseFormat:
-      type: object
-      properties:
-        type:
-          type: string
-          enum:
-            - json_schema
-            - grammar
-          description: >-
-            Must be "grammar" to identify this format type
-          const: grammar
-          default: grammar
-        bnf:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            The BNF grammar specification the response should conform to
-      additionalProperties: false
-      required:
-        - type
-        - bnf
-      title: GrammarResponseFormat
-      description: >-
-        Configuration for grammar-guided response generation.
-    GreedySamplingStrategy:
-      type: object
-      properties:
-        type:
-          type: string
-          const: greedy
-          default: greedy
-          description: >-
-            Must be "greedy" to identify this sampling strategy
-      additionalProperties: false
-      required:
-        - type
-      title: GreedySamplingStrategy
-      description: >-
-        Greedy sampling strategy that selects the highest probability token at each
-        step.
-    JsonSchemaResponseFormat:
-      type: object
-      properties:
-        type:
-          type: string
-          enum:
-            - json_schema
-            - grammar
-          description: >-
-            Must be "json_schema" to identify this format type
-          const: json_schema
-          default: json_schema
-        json_schema:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            The JSON schema the response should conform to. In a Python SDK, this
-            is often a `pydantic` model.
-      additionalProperties: false
-      required:
-        - type
-        - json_schema
-      title: JsonSchemaResponseFormat
-      description: >-
-        Configuration for JSON schema-guided response generation.
-    ResponseFormat:
-      oneOf:
-        - $ref: '#/components/schemas/JsonSchemaResponseFormat'
-        - $ref: '#/components/schemas/GrammarResponseFormat'
-      discriminator:
-        propertyName: type
-        mapping:
-          json_schema: '#/components/schemas/JsonSchemaResponseFormat'
-          grammar: '#/components/schemas/GrammarResponseFormat'
-    SamplingParams:
-      type: object
-      properties:
-        strategy:
-          oneOf:
-            - $ref: '#/components/schemas/GreedySamplingStrategy'
-            - $ref: '#/components/schemas/TopPSamplingStrategy'
-            - $ref: '#/components/schemas/TopKSamplingStrategy'
-          discriminator:
-            propertyName: type
-            mapping:
-              greedy: '#/components/schemas/GreedySamplingStrategy'
-              top_p: '#/components/schemas/TopPSamplingStrategy'
-              top_k: '#/components/schemas/TopKSamplingStrategy'
-          description: The sampling strategy.
-        max_tokens:
-          type: integer
-          description: >-
-            The maximum number of tokens that can be generated in the completion.
-            The token count of your prompt plus max_tokens cannot exceed the model's
-            context length.
-        repetition_penalty:
-          type: number
-          default: 1.0
-          description: >-
-            Number between -2.0 and 2.0. Positive values penalize new tokens based
-            on whether they appear in the text so far, increasing the model's likelihood
-            to talk about new topics.
-        stop:
-          type: array
-          items:
-            type: string
-          description: >-
-            Up to 4 sequences where the API will stop generating further tokens. The
-            returned text will not contain the stop sequence.
-      additionalProperties: false
-      required:
-        - strategy
-      title: SamplingParams
-      description: Sampling parameters.
-    ToolConfig:
-      type: object
-      properties:
-        tool_choice:
-          oneOf:
-            - type: string
-              enum:
-                - auto
-                - required
-                - none
-              title: ToolChoice
-              description: >-
-                Whether tool use is required or automatic. This is a hint to the model
-                which may not be followed. It depends on the Instruction Following
-                capabilities of the model.
-            - type: string
-          default: auto
-          description: >-
-            (Optional) Whether tool use is automatic, required, or none. Can also
-            specify a tool name to use a specific tool. Defaults to ToolChoice.auto.
-        tool_prompt_format:
-          type: string
-          enum:
-            - json
-            - function_tag
-            - python_list
-          description: >-
-            (Optional) Instructs the model how to format tool calls. By default, Llama
-            Stack will attempt to use a format that is best adapted to the model.
-            - `ToolPromptFormat.json`: The tool calls are formatted as a JSON object.
-            - `ToolPromptFormat.function_tag`: The tool calls are enclosed in a <function=function_name>
-            tag. - `ToolPromptFormat.python_list`: The tool calls are output as Python
-            syntax -- a list of function calls.
-        system_message_behavior:
-          type: string
-          enum:
-            - append
-            - replace
-          description: >-
-            (Optional) Config for how to override the default system prompt. - `SystemMessageBehavior.append`:
-            Appends the provided system message to the default system prompt. - `SystemMessageBehavior.replace`:
-            Replaces the default system prompt with the provided system message. The
-            system message can include the string '{{function_definitions}}' to indicate
-            where the function definitions should be inserted.
-          default: append
-      additionalProperties: false
-      title: ToolConfig
-      description: Configuration for tool use.
-    ToolDef:
-      type: object
-      properties:
-        toolgroup_id:
-          type: string
-          description: >-
-            (Optional) ID of the tool group this tool belongs to
-        name:
-          type: string
-          description: Name of the tool
-        description:
-          type: string
-          description: >-
-            (Optional) Human-readable description of what the tool does
-        input_schema:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            (Optional) JSON Schema for tool inputs (MCP inputSchema)
-        output_schema:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            (Optional) JSON Schema for tool outputs (MCP outputSchema)
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            (Optional) Additional metadata about the tool
-      additionalProperties: false
-      required:
-        - name
-      title: ToolDef
-      description: >-
-        Tool definition used in runtime contexts.
-    TopKSamplingStrategy:
-      type: object
-      properties:
-        type:
-          type: string
-          const: top_k
-          default: top_k
-          description: >-
-            Must be "top_k" to identify this sampling strategy
-        top_k:
-          type: integer
-          description: >-
-            Number of top tokens to consider for sampling. Must be at least 1
-      additionalProperties: false
-      required:
-        - type
-        - top_k
-      title: TopKSamplingStrategy
-      description: >-
-        Top-k sampling strategy that restricts sampling to the k most likely tokens.
-    TopPSamplingStrategy:
-      type: object
-      properties:
-        type:
-          type: string
-          const: top_p
-          default: top_p
-          description: >-
-            Must be "top_p" to identify this sampling strategy
-        temperature:
-          type: number
-          description: >-
-            Controls randomness in sampling. Higher values increase randomness
-        top_p:
-          type: number
-          default: 0.95
-          description: >-
-            Cumulative probability threshold for nucleus sampling. Defaults to 0.95
-      additionalProperties: false
-      required:
-        - type
-      title: TopPSamplingStrategy
-      description: >-
-        Top-p (nucleus) sampling strategy that samples from the smallest set of tokens
-        with cumulative probability >= p.
-    CreateAgentRequest:
-      type: object
-      properties:
-        agent_config:
-          $ref: '#/components/schemas/AgentConfig'
-          description: The configuration for the agent.
-      additionalProperties: false
-      required:
-        - agent_config
-      title: CreateAgentRequest
-    AgentCreateResponse:
-      type: object
-      properties:
-        agent_id:
-          type: string
-          description: Unique identifier for the created agent
-      additionalProperties: false
-      required:
-        - agent_id
-      title: AgentCreateResponse
-      description: >-
-        Response returned when creating a new agent.
-    Agent:
-      type: object
-      properties:
-        agent_id:
-          type: string
-          description: Unique identifier for the agent
-        agent_config:
-          $ref: '#/components/schemas/AgentConfig'
-          description: Configuration settings for the agent
-        created_at:
-          type: string
-          format: date-time
-          description: Timestamp when the agent was created
-      additionalProperties: false
-      required:
-        - agent_id
-        - agent_config
-        - created_at
-      title: Agent
-      description: >-
-        An agent instance with configuration and metadata.
-    CreateAgentSessionRequest:
-      type: object
-      properties:
-        session_name:
-          type: string
-          description: The name of the session to create.
-      additionalProperties: false
-      required:
-        - session_name
-      title: CreateAgentSessionRequest
-    AgentSessionCreateResponse:
-      type: object
-      properties:
-        session_id:
-          type: string
-          description: >-
-            Unique identifier for the created session
-      additionalProperties: false
-      required:
-        - session_id
-      title: AgentSessionCreateResponse
-      description: >-
-        Response returned when creating a new agent session.
-    CompletionMessage:
-      type: object
-      properties:
-        role:
-          type: string
-          const: assistant
-          default: assistant
-          description: >-
-            Must be "assistant" to identify this as the model's response
-        content:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: The content of the model's response
-        stop_reason:
-          type: string
-          enum:
-            - end_of_turn
-            - end_of_message
-            - out_of_tokens
-          description: >-
-            Reason why the model stopped generating. Options are: - `StopReason.end_of_turn`:
-            The model finished generating the entire response. - `StopReason.end_of_message`:
-            The model finished generating but generated a partial response -- usually,
-            a tool call. The user may call the tool and continue the conversation
-            with the tool's response. - `StopReason.out_of_tokens`: The model ran
-            out of token budget.
-        tool_calls:
-          type: array
-          items:
-            $ref: '#/components/schemas/ToolCall'
-          description: >-
-            List of tool calls. Each tool call is a ToolCall object.
-      additionalProperties: false
-      required:
-        - role
-        - content
-        - stop_reason
-      title: CompletionMessage
-      description: >-
-        A message containing the model's (assistant) response in a chat conversation.
-    ImageContentItem:
-      type: object
-      properties:
-        type:
-          type: string
-          const: image
-          default: image
-          description: >-
-            Discriminator type of the content item. Always "image"
-        image:
-          type: object
-          properties:
-            url:
-              $ref: '#/components/schemas/URL'
-              description: >-
-                A URL of the image or data URL in the format of data:image/{type};base64,{data}.
-                Note that URL could have length limits.
-            data:
-              type: string
-              contentEncoding: base64
-              description: base64 encoded image data as string
-          additionalProperties: false
-          description: >-
-            Image as a base64 encoded string or an URL
-      additionalProperties: false
-      required:
-        - type
-        - image
-      title: ImageContentItem
-      description: A image content item
-    InferenceStep:
-      type: object
-      properties:
-        turn_id:
-          type: string
-          description: The ID of the turn.
-        step_id:
-          type: string
-          description: The ID of the step.
-        started_at:
-          type: string
-          format: date-time
-          description: The time the step started.
-        completed_at:
-          type: string
-          format: date-time
-          description: The time the step completed.
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          title: StepType
-          description: Type of the step in an agent turn.
-          const: inference
-          default: inference
-        model_response:
-          $ref: '#/components/schemas/CompletionMessage'
-          description: The response from the LLM.
-      additionalProperties: false
-      required:
-        - turn_id
-        - step_id
-        - step_type
-        - model_response
-      title: InferenceStep
-      description: An inference step in an agent turn.
-    InterleavedContent:
-      oneOf:
-        - type: string
-        - $ref: '#/components/schemas/InterleavedContentItem'
-        - type: array
-          items:
-            $ref: '#/components/schemas/InterleavedContentItem'
-    InterleavedContentItem:
-      oneOf:
-        - $ref: '#/components/schemas/ImageContentItem'
-        - $ref: '#/components/schemas/TextContentItem'
-      discriminator:
-        propertyName: type
-        mapping:
-          image: '#/components/schemas/ImageContentItem'
-          text: '#/components/schemas/TextContentItem'
-    MemoryRetrievalStep:
-      type: object
-      properties:
-        turn_id:
-          type: string
-          description: The ID of the turn.
-        step_id:
-          type: string
-          description: The ID of the step.
-        started_at:
-          type: string
-          format: date-time
-          description: The time the step started.
-        completed_at:
-          type: string
-          format: date-time
-          description: The time the step completed.
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          title: StepType
-          description: Type of the step in an agent turn.
-          const: memory_retrieval
-          default: memory_retrieval
-        vector_store_ids:
-          type: string
-          description: >-
-            The IDs of the vector databases to retrieve context from.
-        inserted_context:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: >-
-            The context retrieved from the vector databases.
-      additionalProperties: false
-      required:
-        - turn_id
-        - step_id
-        - step_type
-        - vector_store_ids
-        - inserted_context
-      title: MemoryRetrievalStep
-      description: >-
-        A memory retrieval step in an agent turn.
-    SafetyViolation:
-      type: object
-      properties:
-        violation_level:
-          $ref: '#/components/schemas/ViolationLevel'
-          description: Severity level of the violation
-        user_message:
-          type: string
-          description: >-
-            (Optional) Message to convey to the user about the violation
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            Additional metadata including specific violation codes for debugging and
-            telemetry
-      additionalProperties: false
-      required:
-        - violation_level
-        - metadata
-      title: SafetyViolation
-      description: >-
-        Details of a safety violation detected by content moderation.
-    Session:
-      type: object
-      properties:
-        session_id:
-          type: string
-          description: >-
-            Unique identifier for the conversation session
-        session_name:
-          type: string
-          description: Human-readable name for the session
-        turns:
-          type: array
-          items:
-            $ref: '#/components/schemas/Turn'
-          description: >-
-            List of all turns that have occurred in this session
-        started_at:
-          type: string
-          format: date-time
-          description: Timestamp when the session was created
-      additionalProperties: false
-      required:
-        - session_id
-        - session_name
-        - turns
-        - started_at
-      title: Session
-      description: >-
-        A single session of an interaction with an Agentic System.
-    ShieldCallStep:
-      type: object
-      properties:
-        turn_id:
-          type: string
-          description: The ID of the turn.
-        step_id:
-          type: string
-          description: The ID of the step.
-        started_at:
-          type: string
-          format: date-time
-          description: The time the step started.
-        completed_at:
-          type: string
-          format: date-time
-          description: The time the step completed.
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          title: StepType
-          description: Type of the step in an agent turn.
-          const: shield_call
-          default: shield_call
-        violation:
-          $ref: '#/components/schemas/SafetyViolation'
-          description: The violation from the shield call.
-      additionalProperties: false
-      required:
-        - turn_id
-        - step_id
-        - step_type
-      title: ShieldCallStep
-      description: A shield call step in an agent turn.
-    TextContentItem:
-      type: object
-      properties:
-        type:
-          type: string
-          const: text
-          default: text
-          description: >-
-            Discriminator type of the content item. Always "text"
-        text:
-          type: string
-          description: Text content
-      additionalProperties: false
-      required:
-        - type
-        - text
-      title: TextContentItem
-      description: A text content item
-    ToolCall:
-      type: object
-      properties:
-        call_id:
-          type: string
-        tool_name:
-          oneOf:
-            - type: string
-              enum:
-                - brave_search
-                - wolfram_alpha
-                - photogen
-                - code_interpreter
-              title: BuiltinTool
-            - type: string
-        arguments:
-          type: string
-      additionalProperties: false
-      required:
-        - call_id
-        - tool_name
-        - arguments
-      title: ToolCall
-    ToolExecutionStep:
-      type: object
-      properties:
-        turn_id:
-          type: string
-          description: The ID of the turn.
-        step_id:
-          type: string
-          description: The ID of the step.
-        started_at:
-          type: string
-          format: date-time
-          description: The time the step started.
-        completed_at:
-          type: string
-          format: date-time
-          description: The time the step completed.
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          title: StepType
-          description: Type of the step in an agent turn.
-          const: tool_execution
-          default: tool_execution
-        tool_calls:
-          type: array
-          items:
-            $ref: '#/components/schemas/ToolCall'
-          description: The tool calls to execute.
-        tool_responses:
-          type: array
-          items:
-            $ref: '#/components/schemas/ToolResponse'
-          description: The tool responses from the tool calls.
-      additionalProperties: false
-      required:
-        - turn_id
-        - step_id
-        - step_type
-        - tool_calls
-        - tool_responses
-      title: ToolExecutionStep
-      description: A tool execution step in an agent turn.
-    ToolResponse:
-      type: object
-      properties:
-        call_id:
-          type: string
-          description: >-
-            Unique identifier for the tool call this response is for
-        tool_name:
-          oneOf:
-            - type: string
-              enum:
-                - brave_search
-                - wolfram_alpha
-                - photogen
-                - code_interpreter
-              title: BuiltinTool
-            - type: string
-          description: Name of the tool that was invoked
-        content:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: The response content from the tool
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            (Optional) Additional metadata about the tool response
-      additionalProperties: false
-      required:
-        - call_id
-        - tool_name
-        - content
-      title: ToolResponse
-      description: Response from a tool invocation.
-    ToolResponseMessage:
-      type: object
-      properties:
-        role:
-          type: string
-          const: tool
-          default: tool
-          description: >-
-            Must be "tool" to identify this as a tool response
-        call_id:
-          type: string
-          description: >-
-            Unique identifier for the tool call this response is for
-        content:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: The response content from the tool
-      additionalProperties: false
-      required:
-        - role
-        - call_id
-        - content
-      title: ToolResponseMessage
-      description: >-
-        A message representing the result of a tool invocation.
-    Turn:
-      type: object
-      properties:
-        turn_id:
-          type: string
-          description: >-
-            Unique identifier for the turn within a session
-        session_id:
-          type: string
-          description: >-
-            Unique identifier for the conversation session
-        input_messages:
-          type: array
-          items:
-            oneOf:
-              - $ref: '#/components/schemas/UserMessage'
-              - $ref: '#/components/schemas/ToolResponseMessage'
-          description: >-
-            List of messages that initiated this turn
-        steps:
-          type: array
-          items:
-            oneOf:
-              - $ref: '#/components/schemas/InferenceStep'
-              - $ref: '#/components/schemas/ToolExecutionStep'
-              - $ref: '#/components/schemas/ShieldCallStep'
-              - $ref: '#/components/schemas/MemoryRetrievalStep'
-            discriminator:
-              propertyName: step_type
-              mapping:
-                inference: '#/components/schemas/InferenceStep'
-                tool_execution: '#/components/schemas/ToolExecutionStep'
-                shield_call: '#/components/schemas/ShieldCallStep'
-                memory_retrieval: '#/components/schemas/MemoryRetrievalStep'
-          description: >-
-            Ordered list of processing steps executed during this turn
-        output_message:
-          $ref: '#/components/schemas/CompletionMessage'
-          description: >-
-            The model's generated response containing content and metadata
-        output_attachments:
-          type: array
-          items:
-            type: object
-            properties:
-              content:
-                oneOf:
-                  - type: string
-                  - $ref: '#/components/schemas/InterleavedContentItem'
-                  - type: array
-                    items:
-                      $ref: '#/components/schemas/InterleavedContentItem'
-                  - $ref: '#/components/schemas/URL'
-                description: The content of the attachment.
-              mime_type:
-                type: string
-                description: The MIME type of the attachment.
-            additionalProperties: false
-            required:
-              - content
-              - mime_type
-            title: Attachment
-            description: An attachment to an agent turn.
-          description: >-
-            (Optional) Files or media attached to the agent's response
-        started_at:
-          type: string
-          format: date-time
-          description: Timestamp when the turn began
-        completed_at:
-          type: string
-          format: date-time
-          description: >-
-            (Optional) Timestamp when the turn finished, if completed
-      additionalProperties: false
-      required:
-        - turn_id
-        - session_id
-        - input_messages
-        - steps
-        - output_message
-        - started_at
-      title: Turn
-      description: >-
-        A single turn in an interaction with an Agentic System.
-    URL:
-      type: object
-      properties:
-        uri:
-          type: string
-          description: The URL string pointing to the resource
-      additionalProperties: false
-      required:
-        - uri
-      title: URL
-      description: A URL reference to external content.
-    UserMessage:
-      type: object
-      properties:
-        role:
-          type: string
-          const: user
-          default: user
-          description: >-
-            Must be "user" to identify this as a user message
-        content:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: >-
-            The content of the message, which can include text and other media
-        context:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: >-
-            (Optional) This field is used internally by Llama Stack to pass RAG context.
-            This field may be removed in the API in the future.
-      additionalProperties: false
-      required:
-        - role
-        - content
-      title: UserMessage
-      description: >-
-        A message from the user in a chat conversation.
-    ViolationLevel:
-      type: string
-      enum:
-        - info
-        - warn
-        - error
-      title: ViolationLevel
-      description: Severity level of a safety violation.
-    CreateAgentTurnRequest:
-      type: object
-      properties:
-        messages:
-          type: array
-          items:
-            oneOf:
-              - $ref: '#/components/schemas/UserMessage'
-              - $ref: '#/components/schemas/ToolResponseMessage'
-          description: List of messages to start the turn with.
-        stream:
-          type: boolean
-          description: >-
-            (Optional) If True, generate an SSE event stream of the response. Defaults
-            to False.
-        documents:
-          type: array
-          items:
-            type: object
-            properties:
-              content:
-                oneOf:
-                  - type: string
-                  - $ref: '#/components/schemas/InterleavedContentItem'
-                  - type: array
-                    items:
-                      $ref: '#/components/schemas/InterleavedContentItem'
-                  - $ref: '#/components/schemas/URL'
-                description: The content of the document.
-              mime_type:
-                type: string
-                description: The MIME type of the document.
-            additionalProperties: false
-            required:
-              - content
-              - mime_type
-            title: Document
-            description: A document to be used by an agent.
-          description: >-
-            (Optional) List of documents to create the turn with.
-        toolgroups:
-          type: array
-          items:
-            $ref: '#/components/schemas/AgentTool'
-          description: >-
-            (Optional) List of toolgroups to create the turn with, will be used in
-            addition to the agent's config toolgroups for the request.
-        tool_config:
-          $ref: '#/components/schemas/ToolConfig'
-          description: >-
-            (Optional) The tool configuration to create the turn with, will be used
-            to override the agent's tool_config.
-      additionalProperties: false
-      required:
-        - messages
-      title: CreateAgentTurnRequest
-    AgentTurnResponseEvent:
-      type: object
-      properties:
-        payload:
-          oneOf:
-            - $ref: '#/components/schemas/AgentTurnResponseStepStartPayload'
-            - $ref: '#/components/schemas/AgentTurnResponseStepProgressPayload'
-            - $ref: '#/components/schemas/AgentTurnResponseStepCompletePayload'
-            - $ref: '#/components/schemas/AgentTurnResponseTurnStartPayload'
-            - $ref: '#/components/schemas/AgentTurnResponseTurnCompletePayload'
-            - $ref: '#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload'
-          discriminator:
-            propertyName: event_type
-            mapping:
-              step_start: '#/components/schemas/AgentTurnResponseStepStartPayload'
-              step_progress: '#/components/schemas/AgentTurnResponseStepProgressPayload'
-              step_complete: '#/components/schemas/AgentTurnResponseStepCompletePayload'
-              turn_start: '#/components/schemas/AgentTurnResponseTurnStartPayload'
-              turn_complete: '#/components/schemas/AgentTurnResponseTurnCompletePayload'
-              turn_awaiting_input: '#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload'
-          description: >-
-            Event-specific payload containing event data
-      additionalProperties: false
-      required:
-        - payload
-      title: AgentTurnResponseEvent
-      description: >-
-        An event in an agent turn response stream.
-    AgentTurnResponseStepCompletePayload:
-      type: object
-      properties:
-        event_type:
-          type: string
-          enum:
-            - step_start
-            - step_complete
-            - step_progress
-            - turn_start
-            - turn_complete
-            - turn_awaiting_input
-          const: step_complete
-          default: step_complete
-          description: Type of event being reported
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          description: Type of step being executed
-        step_id:
-          type: string
-          description: >-
-            Unique identifier for the step within a turn
-        step_details:
-          oneOf:
-            - $ref: '#/components/schemas/InferenceStep'
-            - $ref: '#/components/schemas/ToolExecutionStep'
-            - $ref: '#/components/schemas/ShieldCallStep'
-            - $ref: '#/components/schemas/MemoryRetrievalStep'
-          discriminator:
-            propertyName: step_type
-            mapping:
-              inference: '#/components/schemas/InferenceStep'
-              tool_execution: '#/components/schemas/ToolExecutionStep'
-              shield_call: '#/components/schemas/ShieldCallStep'
-              memory_retrieval: '#/components/schemas/MemoryRetrievalStep'
-          description: Complete details of the executed step
-      additionalProperties: false
-      required:
-        - event_type
-        - step_type
-        - step_id
-        - step_details
-      title: AgentTurnResponseStepCompletePayload
-      description: >-
-        Payload for step completion events in agent turn responses.
-    AgentTurnResponseStepProgressPayload:
-      type: object
-      properties:
-        event_type:
-          type: string
-          enum:
-            - step_start
-            - step_complete
-            - step_progress
-            - turn_start
-            - turn_complete
-            - turn_awaiting_input
-          const: step_progress
-          default: step_progress
-          description: Type of event being reported
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          description: Type of step being executed
-        step_id:
-          type: string
-          description: >-
-            Unique identifier for the step within a turn
-        delta:
-          oneOf:
-            - $ref: '#/components/schemas/TextDelta'
-            - $ref: '#/components/schemas/ImageDelta'
-            - $ref: '#/components/schemas/ToolCallDelta'
-          discriminator:
-            propertyName: type
-            mapping:
-              text: '#/components/schemas/TextDelta'
-              image: '#/components/schemas/ImageDelta'
-              tool_call: '#/components/schemas/ToolCallDelta'
-          description: >-
-            Incremental content changes during step execution
-      additionalProperties: false
-      required:
-        - event_type
-        - step_type
-        - step_id
-        - delta
-      title: AgentTurnResponseStepProgressPayload
-      description: >-
-        Payload for step progress events in agent turn responses.
-    AgentTurnResponseStepStartPayload:
-      type: object
-      properties:
-        event_type:
-          type: string
-          enum:
-            - step_start
-            - step_complete
-            - step_progress
-            - turn_start
-            - turn_complete
-            - turn_awaiting_input
-          const: step_start
-          default: step_start
-          description: Type of event being reported
-        step_type:
-          type: string
-          enum:
-            - inference
-            - tool_execution
-            - shield_call
-            - memory_retrieval
-          description: Type of step being executed
-        step_id:
-          type: string
-          description: >-
-            Unique identifier for the step within a turn
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            (Optional) Additional metadata for the step
-      additionalProperties: false
-      required:
-        - event_type
-        - step_type
-        - step_id
-      title: AgentTurnResponseStepStartPayload
-      description: >-
-        Payload for step start events in agent turn responses.
-    AgentTurnResponseStreamChunk:
-      type: object
-      properties:
-        event:
-          $ref: '#/components/schemas/AgentTurnResponseEvent'
-          description: >-
-            Individual event in the agent turn response stream
-      additionalProperties: false
-      required:
-        - event
-      title: AgentTurnResponseStreamChunk
-      description: Streamed agent turn completion response.
-    "AgentTurnResponseTurnAwaitingInputPayload":
-      type: object
-      properties:
-        event_type:
-          type: string
-          enum:
-            - step_start
-            - step_complete
-            - step_progress
-            - turn_start
-            - turn_complete
-            - turn_awaiting_input
-          const: turn_awaiting_input
-          default: turn_awaiting_input
-          description: Type of event being reported
-        turn:
-          $ref: '#/components/schemas/Turn'
-          description: >-
-            Turn data when waiting for external tool responses
-      additionalProperties: false
-      required:
-        - event_type
-        - turn
-      title: >-
-        AgentTurnResponseTurnAwaitingInputPayload
-      description: >-
-        Payload for turn awaiting input events in agent turn responses.
-    AgentTurnResponseTurnCompletePayload:
-      type: object
-      properties:
-        event_type:
-          type: string
-          enum:
-            - step_start
-            - step_complete
-            - step_progress
-            - turn_start
-            - turn_complete
-            - turn_awaiting_input
-          const: turn_complete
-          default: turn_complete
-          description: Type of event being reported
-        turn:
-          $ref: '#/components/schemas/Turn'
-          description: >-
-            Complete turn data including all steps and results
-      additionalProperties: false
-      required:
-        - event_type
-        - turn
-      title: AgentTurnResponseTurnCompletePayload
-      description: >-
-        Payload for turn completion events in agent turn responses.
-    AgentTurnResponseTurnStartPayload:
-      type: object
-      properties:
-        event_type:
-          type: string
-          enum:
-            - step_start
-            - step_complete
-            - step_progress
-            - turn_start
-            - turn_complete
-            - turn_awaiting_input
-          const: turn_start
-          default: turn_start
-          description: Type of event being reported
-        turn_id:
-          type: string
-          description: >-
-            Unique identifier for the turn within a session
-      additionalProperties: false
-      required:
-        - event_type
-        - turn_id
-      title: AgentTurnResponseTurnStartPayload
-      description: >-
-        Payload for turn start events in agent turn responses.
-    ImageDelta:
-      type: object
-      properties:
-        type:
-          type: string
-          const: image
-          default: image
-          description: >-
-            Discriminator type of the delta. Always "image"
-        image:
-          type: string
-          contentEncoding: base64
-          description: The incremental image data as bytes
-      additionalProperties: false
-      required:
-        - type
-        - image
-      title: ImageDelta
-      description: >-
-        An image content delta for streaming responses.
-    TextDelta:
-      type: object
-      properties:
-        type:
-          type: string
-          const: text
-          default: text
-          description: >-
-            Discriminator type of the delta. Always "text"
-        text:
-          type: string
-          description: The incremental text content
-      additionalProperties: false
-      required:
-        - type
-        - text
-      title: TextDelta
-      description: >-
-        A text content delta for streaming responses.
-    ToolCallDelta:
-      type: object
-      properties:
-        type:
-          type: string
-          const: tool_call
-          default: tool_call
-          description: >-
-            Discriminator type of the delta. Always "tool_call"
-        tool_call:
-          oneOf:
-            - type: string
-            - $ref: '#/components/schemas/ToolCall'
-          description: >-
-            Either an in-progress tool call string or the final parsed tool call
-        parse_status:
-          type: string
-          enum:
-            - started
-            - in_progress
-            - failed
-            - succeeded
-          description: Current parsing status of the tool call
-      additionalProperties: false
-      required:
-        - type
-        - tool_call
-        - parse_status
-      title: ToolCallDelta
-      description: >-
-        A tool call content delta for streaming responses.
-    ResumeAgentTurnRequest:
-      type: object
-      properties:
-        tool_responses:
-          type: array
-          items:
-            $ref: '#/components/schemas/ToolResponse'
-          description: >-
-            The tool call responses to resume the turn with.
-        stream:
-          type: boolean
-          description: Whether to stream the response.
-      additionalProperties: false
-      required:
-        - tool_responses
-      title: ResumeAgentTurnRequest
-    AgentStepResponse:
-      type: object
-      properties:
-        step:
-          oneOf:
-            - $ref: '#/components/schemas/InferenceStep'
-            - $ref: '#/components/schemas/ToolExecutionStep'
-            - $ref: '#/components/schemas/ShieldCallStep'
-            - $ref: '#/components/schemas/MemoryRetrievalStep'
-          discriminator:
-            propertyName: step_type
-            mapping:
-              inference: '#/components/schemas/InferenceStep'
-              tool_execution: '#/components/schemas/ToolExecutionStep'
-              shield_call: '#/components/schemas/ShieldCallStep'
-              memory_retrieval: '#/components/schemas/MemoryRetrievalStep'
-          description: >-
-            The complete step data and execution details
-      additionalProperties: false
-      required:
-        - step
-      title: AgentStepResponse
-      description: >-
-        Response containing details of a specific agent step.
-    AppendRowsRequest:
-      type: object
-      properties:
-        rows:
-          type: array
-          items:
-            type: object
-            additionalProperties:
-              oneOf:
-                - type: 'null'
-                - type: boolean
-                - type: number
-                - type: string
-                - type: array
-                - type: object
-          description: The rows to append to the dataset.
-      additionalProperties: false
-      required:
-        - rows
-      title: AppendRowsRequest
-    Dataset:
-      type: object
-      properties:
-        identifier:
-          type: string
-        provider_resource_id:
-          type: string
-        provider_id:
-          type: string
-        type:
-          type: string
-          enum:
-            - model
-            - shield
-            - vector_store
-            - dataset
-            - scoring_function
-            - benchmark
-            - tool
-            - tool_group
-            - prompt
-          const: dataset
-          default: dataset
-          description: >-
-            Type of resource, always 'dataset' for datasets
-        purpose:
-          type: string
-          enum:
-            - post-training/messages
-            - eval/question-answer
-            - eval/messages-answer
-          description: >-
-            Purpose of the dataset indicating its intended use
-        source:
-          oneOf:
-            - $ref: '#/components/schemas/URIDataSource'
-            - $ref: '#/components/schemas/RowsDataSource'
-          discriminator:
-            propertyName: type
-            mapping:
-              uri: '#/components/schemas/URIDataSource'
-              rows: '#/components/schemas/RowsDataSource'
-          description: >-
-            Data source configuration for the dataset
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: Additional metadata for the dataset
-      additionalProperties: false
-      required:
-        - identifier
-        - provider_id
-        - type
-        - purpose
-        - source
-        - metadata
-      title: Dataset
-      description: >-
-        Dataset resource for storing and accessing training or evaluation data.
-    RowsDataSource:
-      type: object
-      properties:
-        type:
-          type: string
-          const: rows
-          default: rows
-        rows:
-          type: array
-          items:
-            type: object
-            additionalProperties:
-              oneOf:
-                - type: 'null'
-                - type: boolean
-                - type: number
-                - type: string
-                - type: array
-                - type: object
-          description: >-
-            The dataset is stored in rows. E.g. - [ {"messages": [{"role": "user",
-            "content": "Hello, world!"}, {"role": "assistant", "content": "Hello,
-            world!"}]} ]
-      additionalProperties: false
-      required:
-        - type
-        - rows
-      title: RowsDataSource
-      description: A dataset stored in rows.
-    URIDataSource:
-      type: object
-      properties:
-        type:
-          type: string
-          const: uri
-          default: uri
-        uri:
-          type: string
-          description: >-
-            The dataset can be obtained from a URI. E.g. - "https://mywebsite.com/mydata.jsonl"
-            - "lsfs://mydata.jsonl" - "data:csv;base64,{base64_content}"
-      additionalProperties: false
-      required:
-        - type
-        - uri
-      title: URIDataSource
-      description: >-
-        A dataset that can be obtained from a URI.
-    ListDatasetsResponse:
-      type: object
-      properties:
-        data:
-          type: array
-          items:
-            $ref: '#/components/schemas/Dataset'
-          description: List of datasets
-      additionalProperties: false
-      required:
-        - data
-      title: ListDatasetsResponse
-      description: Response from listing datasets.
-    DataSource:
-      oneOf:
-        - $ref: '#/components/schemas/URIDataSource'
-        - $ref: '#/components/schemas/RowsDataSource'
-      discriminator:
-        propertyName: type
-        mapping:
-          uri: '#/components/schemas/URIDataSource'
-          rows: '#/components/schemas/RowsDataSource'
-    RegisterDatasetRequest:
-      type: object
-      properties:
-        purpose:
-          type: string
-          enum:
-            - post-training/messages
-            - eval/question-answer
-            - eval/messages-answer
-          description: >-
-            The purpose of the dataset. One of: - "post-training/messages": The dataset
-            contains a messages column with list of messages for post-training. {
-            "messages": [ {"role": "user", "content": "Hello, world!"}, {"role": "assistant",
-            "content": "Hello, world!"}, ] } - "eval/question-answer": The dataset
-            contains a question column and an answer column for evaluation. { "question":
-            "What is the capital of France?", "answer": "Paris" } - "eval/messages-answer":
-            The dataset contains a messages column with list of messages and an answer
-            column for evaluation. { "messages": [ {"role": "user", "content": "Hello,
-            my name is John Doe."}, {"role": "assistant", "content": "Hello, John
-            Doe. How can I help you today?"}, {"role": "user", "content": "What's
-            my name?"}, ], "answer": "John Doe" }
-        source:
-          $ref: '#/components/schemas/DataSource'
-          description: >-
-            The data source of the dataset. Ensure that the data source schema is
-            compatible with the purpose of the dataset. Examples: - { "type": "uri",
-            "uri": "https://mywebsite.com/mydata.jsonl" } - { "type": "uri", "uri":
-            "lsfs://mydata.jsonl" } - { "type": "uri", "uri": "data:csv;base64,{base64_content}"
-            } - { "type": "uri", "uri": "huggingface://llamastack/simpleqa?split=train"
-            } - { "type": "rows", "rows": [ { "messages": [ {"role": "user", "content":
-            "Hello, world!"}, {"role": "assistant", "content": "Hello, world!"}, ]
-            } ] }
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            The metadata for the dataset. - E.g. {"description": "My dataset"}.
-        dataset_id:
-          type: string
-          description: >-
-            The ID of the dataset. If not provided, an ID will be generated.
-      additionalProperties: false
-      required:
-        - purpose
-        - source
-      title: RegisterDatasetRequest
-    Benchmark:
-      type: object
-      properties:
-        identifier:
-          type: string
-        provider_resource_id:
-          type: string
-        provider_id:
-          type: string
-        type:
-          type: string
-          enum:
-            - model
-            - shield
-            - vector_store
-            - dataset
-            - scoring_function
-            - benchmark
-            - tool
-            - tool_group
-            - prompt
-          const: benchmark
-          default: benchmark
-          description: The resource type, always benchmark
-        dataset_id:
-          type: string
-          description: >-
-            Identifier of the dataset to use for the benchmark evaluation
-        scoring_functions:
-          type: array
-          items:
-            type: string
-          description: >-
-            List of scoring function identifiers to apply during evaluation
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: Metadata for this evaluation task
-      additionalProperties: false
-      required:
-        - identifier
-        - provider_id
-        - type
-        - dataset_id
-        - scoring_functions
-        - metadata
-      title: Benchmark
-      description: >-
-        A benchmark resource for evaluating model performance.
-    ListBenchmarksResponse:
-      type: object
-      properties:
-        data:
-          type: array
-          items:
-            $ref: '#/components/schemas/Benchmark'
-      additionalProperties: false
-      required:
-        - data
-      title: ListBenchmarksResponse
-    RegisterBenchmarkRequest:
-      type: object
-      properties:
-        benchmark_id:
-          type: string
-          description: The ID of the benchmark to register.
-        dataset_id:
-          type: string
-          description: >-
-            The ID of the dataset to use for the benchmark.
-        scoring_functions:
-          type: array
-          items:
-            type: string
-          description: >-
-            The scoring functions to use for the benchmark.
-        provider_benchmark_id:
-          type: string
-          description: >-
-            The ID of the provider benchmark to use for the benchmark.
-        provider_id:
-          type: string
-          description: >-
-            The ID of the provider to use for the benchmark.
-        metadata:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: The metadata to use for the benchmark.
-      additionalProperties: false
-      required:
-        - benchmark_id
-        - dataset_id
-        - scoring_functions
-      title: RegisterBenchmarkRequest
-    AgentCandidate:
-      type: object
-      properties:
-        type:
-          type: string
-          const: agent
-          default: agent
-        config:
-          $ref: '#/components/schemas/AgentConfig'
-          description: >-
-            The configuration for the agent candidate.
-      additionalProperties: false
-      required:
-        - type
-        - config
-      title: AgentCandidate
-      description: An agent candidate for evaluation.
-    AggregationFunctionType:
-      type: string
-      enum:
-        - average
-        - weighted_average
-        - median
-        - categorical_count
-        - accuracy
-      title: AggregationFunctionType
-      description: >-
-        Types of aggregation functions for scoring results.
-    BasicScoringFnParams:
-      type: object
-      properties:
-        type:
-          $ref: '#/components/schemas/ScoringFnParamsType'
-          const: basic
-          default: basic
-          description: >-
-            The type of scoring function parameters, always basic
-        aggregation_functions:
-          type: array
-          items:
-            $ref: '#/components/schemas/AggregationFunctionType'
-          description: >-
-            Aggregation functions to apply to the scores of each row
-      additionalProperties: false
-      required:
-        - type
-        - aggregation_functions
-      title: BasicScoringFnParams
-      description: >-
-        Parameters for basic scoring function configuration.
-    BenchmarkConfig:
-      type: object
-      properties:
-        eval_candidate:
-          oneOf:
-            - $ref: '#/components/schemas/ModelCandidate'
-            - $ref: '#/components/schemas/AgentCandidate'
-          discriminator:
-            propertyName: type
-            mapping:
-              model: '#/components/schemas/ModelCandidate'
-              agent: '#/components/schemas/AgentCandidate'
-          description: The candidate to evaluate.
-        scoring_params:
-          type: object
-          additionalProperties:
-            $ref: '#/components/schemas/ScoringFnParams'
-          description: >-
-            Map between scoring function id and parameters for each scoring function
-            you want to run
-        num_examples:
-          type: integer
-          description: >-
-            (Optional) The number of examples to evaluate. If not provided, all examples
-            in the dataset will be evaluated
-      additionalProperties: false
-      required:
-        - eval_candidate
-        - scoring_params
-      title: BenchmarkConfig
-      description: >-
-        A benchmark configuration for evaluation.
-    LLMAsJudgeScoringFnParams:
-      type: object
-      properties:
-        type:
-          $ref: '#/components/schemas/ScoringFnParamsType'
-          const: llm_as_judge
-          default: llm_as_judge
-          description: >-
-            The type of scoring function parameters, always llm_as_judge
-        judge_model:
-          type: string
-          description: >-
-            Identifier of the LLM model to use as a judge for scoring
-        prompt_template:
-          type: string
-          description: >-
-            (Optional) Custom prompt template for the judge model
-        judge_score_regexes:
-          type: array
-          items:
-            type: string
-          description: >-
-            Regexes to extract the answer from generated response
-        aggregation_functions:
-          type: array
-          items:
-            $ref: '#/components/schemas/AggregationFunctionType'
-          description: >-
-            Aggregation functions to apply to the scores of each row
-      additionalProperties: false
-      required:
-        - type
-        - judge_model
-        - judge_score_regexes
-        - aggregation_functions
-      title: LLMAsJudgeScoringFnParams
-      description: >-
-        Parameters for LLM-as-judge scoring function configuration.
-    ModelCandidate:
-      type: object
-      properties:
-        type:
-          type: string
-          const: model
-          default: model
-        model:
-          type: string
-          description: The model ID to evaluate.
-        sampling_params:
-          $ref: '#/components/schemas/SamplingParams'
-          description: The sampling parameters for the model.
-        system_message:
-          $ref: '#/components/schemas/SystemMessage'
-          description: >-
-            (Optional) The system message providing instructions or context to the
-            model.
-      additionalProperties: false
-      required:
-        - type
-        - model
-        - sampling_params
-      title: ModelCandidate
-      description: A model candidate for evaluation.
-    RegexParserScoringFnParams:
-      type: object
-      properties:
-        type:
-          $ref: '#/components/schemas/ScoringFnParamsType'
-          const: regex_parser
-          default: regex_parser
-          description: >-
-            The type of scoring function parameters, always regex_parser
-        parsing_regexes:
-          type: array
-          items:
-            type: string
-          description: >-
-            Regex to extract the answer from generated response
-        aggregation_functions:
-          type: array
-          items:
-            $ref: '#/components/schemas/AggregationFunctionType'
-          description: >-
-            Aggregation functions to apply to the scores of each row
-      additionalProperties: false
-      required:
-        - type
-        - parsing_regexes
-        - aggregation_functions
-      title: RegexParserScoringFnParams
-      description: >-
-        Parameters for regex parser scoring function configuration.
-    ScoringFnParams:
-      oneOf:
-        - $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
-        - $ref: '#/components/schemas/RegexParserScoringFnParams'
-        - $ref: '#/components/schemas/BasicScoringFnParams'
-      discriminator:
-        propertyName: type
-        mapping:
-          llm_as_judge: '#/components/schemas/LLMAsJudgeScoringFnParams'
-          regex_parser: '#/components/schemas/RegexParserScoringFnParams'
-          basic: '#/components/schemas/BasicScoringFnParams'
-    ScoringFnParamsType:
-      type: string
-      enum:
-        - llm_as_judge
-        - regex_parser
-        - basic
-      title: ScoringFnParamsType
-      description: >-
-        Types of scoring function parameter configurations.
-    SystemMessage:
-      type: object
-      properties:
-        role:
-          type: string
-          const: system
-          default: system
-          description: >-
-            Must be "system" to identify this as a system message
-        content:
-          $ref: '#/components/schemas/InterleavedContent'
-          description: >-
-            The content of the "system prompt". If multiple system messages are provided,
-            they are concatenated. The underlying Llama Stack code may also add other
-            system messages (for example, for formatting tool definitions).
-      additionalProperties: false
-      required:
-        - role
-        - content
-      title: SystemMessage
-      description: >-
-        A system message providing instructions or context to the model.
-    EvaluateRowsRequest:
-      type: object
-      properties:
-        input_rows:
-          type: array
-          items:
-            type: object
-            additionalProperties:
-              oneOf:
-                - type: 'null'
-                - type: boolean
-                - type: number
-                - type: string
-                - type: array
-                - type: object
-          description: The rows to evaluate.
-        scoring_functions:
-          type: array
-          items:
-            type: string
-          description: >-
-            The scoring functions to use for the evaluation.
-        benchmark_config:
-          $ref: '#/components/schemas/BenchmarkConfig'
-          description: The configuration for the benchmark.
-      additionalProperties: false
-      required:
-        - input_rows
-        - scoring_functions
-        - benchmark_config
-      title: EvaluateRowsRequest
-    EvaluateResponse:
-      type: object
-      properties:
-        generations:
-          type: array
-          items:
-            type: object
-            additionalProperties:
-              oneOf:
-                - type: 'null'
-                - type: boolean
-                - type: number
-                - type: string
-                - type: array
-                - type: object
-          description: The generations from the evaluation.
-        scores:
-          type: object
-          additionalProperties:
-            $ref: '#/components/schemas/ScoringResult'
-          description: The scores from the evaluation.
-      additionalProperties: false
-      required:
-        - generations
-        - scores
-      title: EvaluateResponse
-      description: The response from an evaluation.
-    ScoringResult:
-      type: object
-      properties:
-        score_rows:
-          type: array
-          items:
-            type: object
-            additionalProperties:
-              oneOf:
-                - type: 'null'
-                - type: boolean
-                - type: number
-                - type: string
-                - type: array
-                - type: object
-          description: >-
-            The scoring result for each row. Each row is a map of column name to value.
-        aggregated_results:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: Map of metric name to aggregated value
-      additionalProperties: false
-      required:
-        - score_rows
-        - aggregated_results
-      title: ScoringResult
-      description: A scoring result for a single row.
-    RunEvalRequest:
-      type: object
-      properties:
-        benchmark_config:
-          $ref: '#/components/schemas/BenchmarkConfig'
-          description: The configuration for the benchmark.
-      additionalProperties: false
-      required:
-        - benchmark_config
-      title: RunEvalRequest
-    Job:
-      type: object
-      properties:
-        job_id:
-          type: string
-          description: Unique identifier for the job
-        status:
-          type: string
-          enum:
-            - completed
-            - in_progress
-            - failed
-            - scheduled
-            - cancelled
-          description: Current execution status of the job
-      additionalProperties: false
-      required:
-        - job_id
-        - status
-      title: Job
-      description: >-
-        A job execution instance with status tracking.
-    Checkpoint:
-      type: object
-      properties:
-        identifier:
-          type: string
-          description: Unique identifier for the checkpoint
-        created_at:
-          type: string
-          format: date-time
-          description: >-
-            Timestamp when the checkpoint was created
-        epoch:
-          type: integer
-          description: >-
-            Training epoch when the checkpoint was saved
-        post_training_job_id:
-          type: string
-          description: >-
-            Identifier of the training job that created this checkpoint
-        path:
-          type: string
-          description: >-
-            File system path where the checkpoint is stored
-        training_metrics:
-          $ref: '#/components/schemas/PostTrainingMetric'
-          description: >-
-            (Optional) Training metrics associated with this checkpoint
-      additionalProperties: false
-      required:
-        - identifier
-        - created_at
-        - epoch
-        - post_training_job_id
-        - path
-      title: Checkpoint
-      description: Checkpoint created during training runs.
-    PostTrainingJobArtifactsResponse:
-      type: object
-      properties:
-        job_uuid:
-          type: string
-          description: Unique identifier for the training job
-        checkpoints:
-          type: array
-          items:
-            $ref: '#/components/schemas/Checkpoint'
-          description: >-
-            List of model checkpoints created during training
-      additionalProperties: false
-      required:
-        - job_uuid
-        - checkpoints
-      title: PostTrainingJobArtifactsResponse
-      description: Artifacts of a finetuning job.
-    PostTrainingMetric:
-      type: object
-      properties:
-        epoch:
-          type: integer
-          description: Training epoch number
-        train_loss:
-          type: number
-          description: Loss value on the training dataset
-        validation_loss:
-          type: number
-          description: Loss value on the validation dataset
-        perplexity:
-          type: number
-          description: >-
-            Perplexity metric indicating model confidence
-      additionalProperties: false
-      required:
-        - epoch
-        - train_loss
-        - validation_loss
-        - perplexity
-      title: PostTrainingMetric
-      description: >-
-        Training metrics captured during post-training jobs.
-    CancelTrainingJobRequest:
-      type: object
-      properties:
-        job_uuid:
-          type: string
-          description: The UUID of the job to cancel.
-      additionalProperties: false
-      required:
-        - job_uuid
-      title: CancelTrainingJobRequest
-    PostTrainingJobStatusResponse:
-      type: object
-      properties:
-        job_uuid:
-          type: string
-          description: Unique identifier for the training job
-        status:
-          type: string
-          enum:
-            - completed
-            - in_progress
-            - failed
-            - scheduled
-            - cancelled
-          description: Current status of the training job
-        scheduled_at:
-          type: string
-          format: date-time
-          description: >-
-            (Optional) Timestamp when the job was scheduled
-        started_at:
-          type: string
-          format: date-time
-          description: >-
-            (Optional) Timestamp when the job execution began
-        completed_at:
-          type: string
-          format: date-time
-          description: >-
-            (Optional) Timestamp when the job finished, if completed
-        resources_allocated:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: >-
-            (Optional) Information about computational resources allocated to the
-            job
-        checkpoints:
-          type: array
-          items:
-            $ref: '#/components/schemas/Checkpoint'
-          description: >-
-            List of model checkpoints created during training
-      additionalProperties: false
-      required:
-        - job_uuid
-        - status
-        - checkpoints
-      title: PostTrainingJobStatusResponse
-      description: Status of a finetuning job.
-    ListPostTrainingJobsResponse:
-      type: object
-      properties:
-        data:
-          type: array
-          items:
-            type: object
-            properties:
-              job_uuid:
-                type: string
-            additionalProperties: false
-            required:
-              - job_uuid
-            title: PostTrainingJob
-      additionalProperties: false
-      required:
-        - data
-      title: ListPostTrainingJobsResponse
-    DPOAlignmentConfig:
-      type: object
-      properties:
-        beta:
-          type: number
-          description: Temperature parameter for the DPO loss
-        loss_type:
-          $ref: '#/components/schemas/DPOLossType'
-          default: sigmoid
-          description: The type of loss function to use for DPO
-      additionalProperties: false
-      required:
-        - beta
-        - loss_type
-      title: DPOAlignmentConfig
-      description: >-
-        Configuration for Direct Preference Optimization (DPO) alignment.
-    DPOLossType:
-      type: string
-      enum:
-        - sigmoid
-        - hinge
-        - ipo
-        - kto_pair
-      title: DPOLossType
-    DataConfig:
-      type: object
-      properties:
-        dataset_id:
-          type: string
-          description: >-
-            Unique identifier for the training dataset
-        batch_size:
-          type: integer
-          description: Number of samples per training batch
-        shuffle:
-          type: boolean
-          description: >-
-            Whether to shuffle the dataset during training
-        data_format:
-          $ref: '#/components/schemas/DatasetFormat'
-          description: >-
-            Format of the dataset (instruct or dialog)
-        validation_dataset_id:
-          type: string
-          description: >-
-            (Optional) Unique identifier for the validation dataset
-        packed:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to pack multiple samples into a single sequence for
-            efficiency
-        train_on_input:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to compute loss on input tokens as well as output tokens
-      additionalProperties: false
-      required:
-        - dataset_id
-        - batch_size
-        - shuffle
-        - data_format
-      title: DataConfig
-      description: >-
-        Configuration for training data and data loading.
-    DatasetFormat:
-      type: string
-      enum:
-        - instruct
-        - dialog
-      title: DatasetFormat
-      description: Format of the training dataset.
-    EfficiencyConfig:
-      type: object
-      properties:
-        enable_activation_checkpointing:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to use activation checkpointing to reduce memory usage
-        enable_activation_offloading:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to offload activations to CPU to save GPU memory
-        memory_efficient_fsdp_wrap:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to use memory-efficient FSDP wrapping
-        fsdp_cpu_offload:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to offload FSDP parameters to CPU
-      additionalProperties: false
-      title: EfficiencyConfig
-      description: >-
-        Configuration for memory and compute efficiency optimizations.
-    OptimizerConfig:
-      type: object
-      properties:
-        optimizer_type:
-          $ref: '#/components/schemas/OptimizerType'
-          description: >-
-            Type of optimizer to use (adam, adamw, or sgd)
-        lr:
-          type: number
-          description: Learning rate for the optimizer
-        weight_decay:
-          type: number
-          description: >-
-            Weight decay coefficient for regularization
-        num_warmup_steps:
-          type: integer
-          description: Number of steps for learning rate warmup
-      additionalProperties: false
-      required:
-        - optimizer_type
-        - lr
-        - weight_decay
-        - num_warmup_steps
-      title: OptimizerConfig
-      description: >-
-        Configuration parameters for the optimization algorithm.
-    OptimizerType:
-      type: string
-      enum:
-        - adam
-        - adamw
-        - sgd
-      title: OptimizerType
-      description: >-
-        Available optimizer algorithms for training.
-    TrainingConfig:
-      type: object
-      properties:
-        n_epochs:
-          type: integer
-          description: Number of training epochs to run
-        max_steps_per_epoch:
-          type: integer
-          default: 1
-          description: Maximum number of steps to run per epoch
-        gradient_accumulation_steps:
-          type: integer
-          default: 1
-          description: >-
-            Number of steps to accumulate gradients before updating
-        max_validation_steps:
-          type: integer
-          default: 1
-          description: >-
-            (Optional) Maximum number of validation steps per epoch
-        data_config:
-          $ref: '#/components/schemas/DataConfig'
-          description: >-
-            (Optional) Configuration for data loading and formatting
-        optimizer_config:
-          $ref: '#/components/schemas/OptimizerConfig'
-          description: >-
-            (Optional) Configuration for the optimization algorithm
-        efficiency_config:
-          $ref: '#/components/schemas/EfficiencyConfig'
-          description: >-
-            (Optional) Configuration for memory and compute optimizations
-        dtype:
-          type: string
-          default: bf16
-          description: >-
-            (Optional) Data type for model parameters (bf16, fp16, fp32)
-      additionalProperties: false
-      required:
-        - n_epochs
-        - max_steps_per_epoch
-        - gradient_accumulation_steps
-      title: TrainingConfig
-      description: >-
-        Comprehensive configuration for the training process.
-    PreferenceOptimizeRequest:
-      type: object
-      properties:
-        job_uuid:
-          type: string
-          description: The UUID of the job to create.
-        finetuned_model:
-          type: string
-          description: The model to fine-tune.
-        algorithm_config:
-          $ref: '#/components/schemas/DPOAlignmentConfig'
-          description: The algorithm configuration.
-        training_config:
-          $ref: '#/components/schemas/TrainingConfig'
-          description: The training configuration.
-        hyperparam_search_config:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: The hyperparam search configuration.
-        logger_config:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: The logger configuration.
-      additionalProperties: false
-      required:
-        - job_uuid
-        - finetuned_model
-        - algorithm_config
-        - training_config
-        - hyperparam_search_config
-        - logger_config
-      title: PreferenceOptimizeRequest
-    PostTrainingJob:
-      type: object
-      properties:
-        job_uuid:
-          type: string
-      additionalProperties: false
-      required:
-        - job_uuid
-      title: PostTrainingJob
-    AlgorithmConfig:
-      oneOf:
-        - $ref: '#/components/schemas/LoraFinetuningConfig'
-        - $ref: '#/components/schemas/QATFinetuningConfig'
-      discriminator:
-        propertyName: type
-        mapping:
-          LoRA: '#/components/schemas/LoraFinetuningConfig'
-          QAT: '#/components/schemas/QATFinetuningConfig'
-    LoraFinetuningConfig:
-      type: object
-      properties:
-        type:
-          type: string
-          const: LoRA
-          default: LoRA
-          description: Algorithm type identifier, always "LoRA"
-        lora_attn_modules:
-          type: array
-          items:
-            type: string
-          description: >-
-            List of attention module names to apply LoRA to
-        apply_lora_to_mlp:
-          type: boolean
-          description: Whether to apply LoRA to MLP layers
-        apply_lora_to_output:
-          type: boolean
-          description: >-
-            Whether to apply LoRA to output projection layers
-        rank:
-          type: integer
-          description: >-
-            Rank of the LoRA adaptation (lower rank = fewer parameters)
-        alpha:
-          type: integer
-          description: >-
-            LoRA scaling parameter that controls adaptation strength
-        use_dora:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to use DoRA (Weight-Decomposed Low-Rank Adaptation)
-        quantize_base:
-          type: boolean
-          default: false
-          description: >-
-            (Optional) Whether to quantize the base model weights
-      additionalProperties: false
-      required:
-        - type
-        - lora_attn_modules
-        - apply_lora_to_mlp
-        - apply_lora_to_output
-        - rank
-        - alpha
-      title: LoraFinetuningConfig
-      description: >-
-        Configuration for Low-Rank Adaptation (LoRA) fine-tuning.
-    QATFinetuningConfig:
-      type: object
-      properties:
-        type:
-          type: string
-          const: QAT
-          default: QAT
-          description: Algorithm type identifier, always "QAT"
-        quantizer_name:
-          type: string
-          description: >-
-            Name of the quantization algorithm to use
-        group_size:
-          type: integer
-          description: Size of groups for grouped quantization
-      additionalProperties: false
-      required:
-        - type
-        - quantizer_name
-        - group_size
-      title: QATFinetuningConfig
-      description: >-
-        Configuration for Quantization-Aware Training (QAT) fine-tuning.
-    SupervisedFineTuneRequest:
-      type: object
-      properties:
-        job_uuid:
-          type: string
-          description: The UUID of the job to create.
-        training_config:
-          $ref: '#/components/schemas/TrainingConfig'
-          description: The training configuration.
-        hyperparam_search_config:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: The hyperparam search configuration.
-        logger_config:
-          type: object
-          additionalProperties:
-            oneOf:
-              - type: 'null'
-              - type: boolean
-              - type: number
-              - type: string
-              - type: array
-              - type: object
-          description: The logger configuration.
-        model:
-          type: string
-          description: The model to fine-tune.
-        checkpoint_dir:
-          type: string
-          description: The directory to save checkpoint(s) to.
-        algorithm_config:
-          $ref: '#/components/schemas/AlgorithmConfig'
-          description: The algorithm configuration.
-      additionalProperties: false
-      required:
-        - job_uuid
-        - training_config
-        - hyperparam_search_config
-        - logger_config
-      title: SupervisedFineTuneRequest
   responses:
     BadRequest400:
       description: The request was invalid or malformed
@@ -3901,46 +93,4 @@ components:
             detail: An unexpected error occurred
 security:
   - Default: []
-tags:
-  - name: Agents
-    description: >
-      APIs for creating and interacting with agentic systems.
-
-
-      ## Deprecated APIs
-
-
-      > **⚠️ DEPRECATED**: These APIs are provided for migration reference and will
-      be removed in future versions. Not recommended for new projects.
-
-
-      ### Migration Guidance
-
-
-      If you are using deprecated versions of the Agents or Responses APIs, please
-      migrate to:
-
-
-      - **Responses API**: Use the stable v1 Responses API endpoints
-    x-displayName: Agents
-  - name: Benchmarks
-    description: ''
-  - name: DatasetIO
-    description: ''
-  - name: Datasets
-    description: ''
-  - name: Eval
-    description: >-
-      Llama Stack Evaluation API for running evaluations on model and agent candidates.
-    x-displayName: Evaluations
-  - name: PostTraining (Coming Soon)
-    description: ''
-x-tagGroups:
-  - name: Operations
-    tags:
-      - Agents
-      - Benchmarks
-      - DatasetIO
-      - Datasets
-      - Eval
-      - PostTraining (Coming Soon)
+tags: []
diff --git a/src/llama_stack/apis/benchmarks/benchmarks.py b/src/llama_stack/apis/benchmarks/benchmarks.py
index 030daeb60..933205489 100644
--- a/src/llama_stack/apis/benchmarks/benchmarks.py
+++ b/src/llama_stack/apis/benchmarks/benchmarks.py
@@ -8,7 +8,7 @@ from typing import Any, Literal, Protocol, runtime_checkable
 from pydantic import BaseModel, Field
 
 from llama_stack.apis.resource import Resource, ResourceType
-from llama_stack.apis.version import LLAMA_STACK_API_V1, LLAMA_STACK_API_V1ALPHA
+from llama_stack.apis.version import LLAMA_STACK_API_V1ALPHA
 from llama_stack.schema_utils import json_schema_type, webmethod
 
 
diff --git a/src/llama_stack/apis/datasetio/datasetio.py b/src/llama_stack/apis/datasetio/datasetio.py
index 77adcf9b3..a0c4a1afc 100644
--- a/src/llama_stack/apis/datasetio/datasetio.py
+++ b/src/llama_stack/apis/datasetio/datasetio.py
@@ -8,7 +8,7 @@ from typing import Any, Protocol, runtime_checkable
 
 from llama_stack.apis.common.responses import PaginatedResponse
 from llama_stack.apis.datasets import Dataset
-from llama_stack.apis.version import LLAMA_STACK_API_V1, LLAMA_STACK_API_V1BETA
+from llama_stack.apis.version import LLAMA_STACK_API_V1BETA
 from llama_stack.schema_utils import webmethod
 
 
diff --git a/src/llama_stack/apis/datasets/datasets.py b/src/llama_stack/apis/datasets/datasets.py
index 5d6c76ada..ed4ecec22 100644
--- a/src/llama_stack/apis/datasets/datasets.py
+++ b/src/llama_stack/apis/datasets/datasets.py
@@ -10,7 +10,7 @@ from typing import Annotated, Any, Literal, Protocol
 from pydantic import BaseModel, Field
 
 from llama_stack.apis.resource import Resource, ResourceType
-from llama_stack.apis.version import LLAMA_STACK_API_V1, LLAMA_STACK_API_V1BETA
+from llama_stack.apis.version import LLAMA_STACK_API_V1BETA
 from llama_stack.schema_utils import json_schema_type, register_schema, webmethod
 
 
diff --git a/src/llama_stack/apis/eval/eval.py b/src/llama_stack/apis/eval/eval.py
index b984a2f45..424c90674 100644
--- a/src/llama_stack/apis/eval/eval.py
+++ b/src/llama_stack/apis/eval/eval.py
@@ -13,7 +13,7 @@ from llama_stack.apis.common.job_types import Job
 from llama_stack.apis.inference import SamplingParams, SystemMessage
 from llama_stack.apis.scoring import ScoringResult
 from llama_stack.apis.scoring_functions import ScoringFnParams
-from llama_stack.apis.version import LLAMA_STACK_API_V1, LLAMA_STACK_API_V1ALPHA
+from llama_stack.apis.version import LLAMA_STACK_API_V1ALPHA
 from llama_stack.schema_utils import json_schema_type, register_schema, webmethod
 
 
diff --git a/src/llama_stack/apis/post_training/post_training.py b/src/llama_stack/apis/post_training/post_training.py
index 83cb3a34f..2b7a6222f 100644
--- a/src/llama_stack/apis/post_training/post_training.py
+++ b/src/llama_stack/apis/post_training/post_training.py
@@ -13,7 +13,7 @@ from pydantic import BaseModel, Field
 from llama_stack.apis.common.content_types import URL
 from llama_stack.apis.common.job_types import JobStatus
 from llama_stack.apis.common.training_types import Checkpoint
-from llama_stack.apis.version import LLAMA_STACK_API_V1, LLAMA_STACK_API_V1ALPHA
+from llama_stack.apis.version import LLAMA_STACK_API_V1ALPHA
 from llama_stack.schema_utils import json_schema_type, register_schema, webmethod